diff --git "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" --- "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" +++ "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3539, "train/learning_rate": 0.00029759999999999997, "train/epoch": 2.24, "train/global_step": 500, "_runtime": 11642, "_timestamp": 1648248770, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 411.0, 609.0], "bins": [-88.30326843261719, -86.90232849121094, -85.50139617919922, -84.10045623779297, -82.69951629638672, -81.298583984375, -79.89764404296875, -78.4967041015625, -77.09576416015625, -75.69482421875, -74.29389190673828, -72.89295196533203, -71.49201202392578, -70.09107971191406, -68.69013977050781, -67.28919982910156, -65.88826751708984, -64.4873275756836, -63.08639144897461, -61.685455322265625, -60.284515380859375, -58.88357925415039, -57.482643127441406, -56.081703186035156, -54.680763244628906, -53.27982711791992, -51.87888717651367, -50.47795104980469, -49.07701110839844, -47.67607498168945, -46.27513885498047, -44.87419891357422, -43.473262786865234, -42.07232666015625, -40.67138671875, -39.270450592041016, -37.869510650634766, -36.46857452392578, -35.06763458251953, -33.66669845581055, -32.26576232910156, -30.864824295043945, -29.463886260986328, -28.062950134277344, -26.662012100219727, -25.26107406616211, -23.860136032104492, -22.459197998046875, -21.058259963989258, -19.65732192993164, -18.256383895874023, -16.855445861816406, -15.454509735107422, -14.053571701049805, -12.652633666992188, -11.251696586608887, -9.850757598876953, -8.449819564819336, -7.048882484436035, -5.647944450378418, -4.247006893157959, -2.8460693359375, -1.4451313018798828, -0.04419422149658203, 1.356743335723877]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 8.0, 5.0, 12.0, 16.0, 24.0, 16.0, 19.0, 18.0, 29.0, 43.0, 38.0, 42.0, 45.0, 40.0, 36.0, 39.0, 55.0, 50.0, 33.0, 50.0, 35.0, 38.0, 34.0, 33.0, 31.0, 25.0, 26.0, 25.0, 25.0, 14.0, 20.0, 11.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-3.711008071899414, -3.6036376953125, -3.496267318725586, -3.3888967037200928, -3.2815263271331787, -3.1741559505462646, -3.0667853355407715, -2.9594149589538574, -2.8520445823669434, -2.7446742057800293, -2.6373038291931152, -2.529933214187622, -2.422562837600708, -2.315192461013794, -2.207821846008301, -2.1004514694213867, -1.9930810928344727, -1.8857107162475586, -1.778340220451355, -1.6709697246551514, -1.5635993480682373, -1.4562289714813232, -1.3488584756851196, -1.241487979888916, -1.134117603302002, -1.026747226715088, -0.9193767309188843, -0.8120062947273254, -0.7046358585357666, -0.5972654223442078, -0.4898949861526489, -0.3825245499610901, -0.27515435218811035, -0.1677839159965515, -0.060413479804992676, 0.04695695638656616, 0.154327392578125, 0.26169782876968384, 0.3690682649612427, 0.4764387011528015, 0.5838091373443604, 0.6911795735359192, 0.798550009727478, 0.9059204459190369, 1.0132908821105957, 1.1206612586975098, 1.2280317544937134, 1.335402250289917, 1.442772626876831, 1.5501430034637451, 1.6575134992599487, 1.7648839950561523, 1.8722543716430664, 1.9796247482299805, 2.0869951248168945, 2.1943657398223877, 2.3017361164093018, 2.409106492996216, 2.516477108001709, 2.623847484588623, 2.731217861175537, 2.838588237762451, 2.9459586143493652, 3.0533292293548584, 3.1606996059417725]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 1.0, 10.0, 16.0, 11.0, 20.0, 22.0, 52.0, 64.0, 112.0, 259.0, 510.0, 1177.0, 3263.0, 11252.0, 47641.0, 180398.0, 631313.0, 1818733.0, 1076307.0, 305101.0, 82868.0, 23987.0, 7322.0, 2316.0, 778.0, 337.0, 145.0, 81.0, 52.0, 36.0, 22.0, 15.0, 6.0, 13.0, 6.0, 5.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.37689208984375, -4.2576904296875, -4.13848876953125, -4.019287109375, -3.90008544921875, -3.7808837890625, -3.66168212890625, -3.54248046875, -3.42327880859375, -3.3040771484375, -3.18487548828125, -3.065673828125, -2.94647216796875, -2.8272705078125, -2.70806884765625, -2.5888671875, -2.46966552734375, -2.3504638671875, -2.23126220703125, -2.112060546875, -1.99285888671875, -1.8736572265625, -1.75445556640625, -1.63525390625, -1.51605224609375, -1.3968505859375, -1.27764892578125, -1.158447265625, -1.03924560546875, -0.9200439453125, -0.80084228515625, -0.681640625, -0.56243896484375, -0.4432373046875, -0.32403564453125, -0.204833984375, -0.08563232421875, 0.0335693359375, 0.15277099609375, 0.27197265625, 0.39117431640625, 0.5103759765625, 0.62957763671875, 0.748779296875, 0.86798095703125, 0.9871826171875, 1.10638427734375, 1.2255859375, 1.34478759765625, 1.4639892578125, 1.58319091796875, 1.702392578125, 1.82159423828125, 1.9407958984375, 2.05999755859375, 2.17919921875, 2.29840087890625, 2.4176025390625, 2.53680419921875, 2.656005859375, 2.77520751953125, 2.8944091796875, 3.01361083984375, 3.1328125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 1.0, 3.0, 10.0, 9.0, 16.0, 15.0, 20.0, 28.0, 27.0, 28.0, 35.0, 43.0, 49.0, 48.0, 49.0, 42.0, 47.0, 46.0, 41.0, 46.0, 55.0, 45.0, 33.0, 39.0, 33.0, 27.0, 26.0, 22.0, 24.0, 12.0, 13.0, 13.0, 5.0, 7.0, 6.0, 7.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.94140625, -4.809234619140625, -4.67706298828125, -4.544891357421875, -4.4127197265625, -4.280548095703125, -4.14837646484375, -4.016204833984375, -3.884033203125, -3.751861572265625, -3.61968994140625, -3.487518310546875, -3.3553466796875, -3.223175048828125, -3.09100341796875, -2.958831787109375, -2.82666015625, -2.694488525390625, -2.56231689453125, -2.430145263671875, -2.2979736328125, -2.165802001953125, -2.03363037109375, -1.901458740234375, -1.769287109375, -1.637115478515625, -1.50494384765625, -1.372772216796875, -1.2406005859375, -1.108428955078125, -0.97625732421875, -0.844085693359375, -0.7119140625, -0.579742431640625, -0.44757080078125, -0.315399169921875, -0.1832275390625, -0.051055908203125, 0.08111572265625, 0.213287353515625, 0.345458984375, 0.477630615234375, 0.60980224609375, 0.741973876953125, 0.8741455078125, 1.006317138671875, 1.13848876953125, 1.270660400390625, 1.40283203125, 1.535003662109375, 1.66717529296875, 1.799346923828125, 1.9315185546875, 2.063690185546875, 2.19586181640625, 2.328033447265625, 2.460205078125, 2.592376708984375, 2.72454833984375, 2.856719970703125, 2.9888916015625, 3.121063232421875, 3.25323486328125, 3.385406494140625, 3.517578125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 11.0, 15.0, 21.0, 43.0, 67.0, 155.0, 385.0, 2110.0, 4190160.0, 847.0, 243.0, 114.0, 46.0, 26.0, 11.0, 11.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.6875, -98.4404296875, -95.193359375, -91.9462890625, -88.69921875, -85.4521484375, -82.205078125, -78.9580078125, -75.7109375, -72.4638671875, -69.216796875, -65.9697265625, -62.72265625, -59.4755859375, -56.228515625, -52.9814453125, -49.734375, -46.4873046875, -43.240234375, -39.9931640625, -36.74609375, -33.4990234375, -30.251953125, -27.0048828125, -23.7578125, -20.5107421875, -17.263671875, -14.0166015625, -10.76953125, -7.5224609375, -4.275390625, -1.0283203125, 2.21875, 5.4658203125, 8.712890625, 11.9599609375, 15.20703125, 18.4541015625, 21.701171875, 24.9482421875, 28.1953125, 31.4423828125, 34.689453125, 37.9365234375, 41.18359375, 44.4306640625, 47.677734375, 50.9248046875, 54.171875, 57.4189453125, 60.666015625, 63.9130859375, 67.16015625, 70.4072265625, 73.654296875, 76.9013671875, 80.1484375, 83.3955078125, 86.642578125, 89.8896484375, 93.13671875, 96.3837890625, 99.630859375, 102.8779296875, 106.125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 12.0, 20.0, 32.0, 51.0, 103.0, 248.0, 541.0, 1258.0, 1025.0, 407.0, 170.0, 94.0, 44.0, 28.0, 8.0, 3.0, 10.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.4842529296875, -2.398193359375, -2.3121337890625, -2.22607421875, -2.1400146484375, -2.053955078125, -1.9678955078125, -1.8818359375, -1.7957763671875, -1.709716796875, -1.6236572265625, -1.53759765625, -1.4515380859375, -1.365478515625, -1.2794189453125, -1.193359375, -1.1072998046875, -1.021240234375, -0.9351806640625, -0.84912109375, -0.7630615234375, -0.677001953125, -0.5909423828125, -0.5048828125, -0.4188232421875, -0.332763671875, -0.2467041015625, -0.16064453125, -0.0745849609375, 0.011474609375, 0.0975341796875, 0.18359375, 0.2696533203125, 0.355712890625, 0.4417724609375, 0.52783203125, 0.6138916015625, 0.699951171875, 0.7860107421875, 0.8720703125, 0.9581298828125, 1.044189453125, 1.1302490234375, 1.21630859375, 1.3023681640625, 1.388427734375, 1.4744873046875, 1.560546875, 1.6466064453125, 1.732666015625, 1.8187255859375, 1.90478515625, 1.9908447265625, 2.076904296875, 2.1629638671875, 2.2490234375, 2.3350830078125, 2.421142578125, 2.5072021484375, 2.59326171875, 2.6793212890625, 2.765380859375, 2.8514404296875, 2.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 15.0, 20.0, 49.0, 87.0, 101.0, 141.0, 142.0, 143.0, 92.0, 79.0, 47.0, 31.0, 26.0, 7.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0130157470703125, -4.75441312789917, -4.495810508728027, -4.237207889556885, -3.9786055088043213, -3.7200028896331787, -3.4614005088806152, -3.2027978897094727, -2.94419527053833, -2.6855926513671875, -2.426990032196045, -2.1683876514434814, -1.9097850322723389, -1.6511824131011963, -1.3925799131393433, -1.1339774131774902, -0.8753747940063477, -0.6167722344398499, -0.35816967487335205, -0.09956711530685425, 0.15903544425964355, 0.41763806343078613, 0.6762405633926392, 0.9348430633544922, 1.1934456825256348, 1.4520483016967773, 1.7106508016586304, 1.9692533016204834, 2.227855920791626, 2.4864585399627686, 2.745060920715332, 3.0036635398864746, 3.2622671127319336, 3.520869731903076, 3.7794723510742188, 4.038074970245361, 4.296677589416504, 4.555279731750488, 4.813882350921631, 5.072484970092773, 5.331087589263916, 5.589690208435059, 5.848292827606201, 6.106895446777344, 6.365497589111328, 6.624100685119629, 6.882702827453613, 7.141305446624756, 7.399908065795898, 7.658510684967041, 7.917113304138184, 8.175715446472168, 8.434318542480469, 8.692920684814453, 8.951523780822754, 9.210125923156738, 9.468729019165039, 9.727331161499023, 9.985934257507324, 10.244536399841309, 10.50313949584961, 10.761741638183594, 11.020344734191895, 11.278946876525879, 11.537549018859863]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 10.0, 6.0, 14.0, 19.0, 16.0, 20.0, 21.0, 27.0, 38.0, 40.0, 30.0, 41.0, 43.0, 47.0, 52.0, 46.0, 44.0, 41.0, 44.0, 35.0, 39.0, 31.0, 38.0, 28.0, 38.0, 28.0, 24.0, 20.0, 23.0, 18.0, 10.0, 14.0, 8.0, 7.0, 3.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.213425636291504, -4.086343765258789, -3.9592621326446533, -3.8321802616119385, -3.7050983905792236, -3.578016757965088, -3.450934886932373, -3.323853015899658, -3.1967711448669434, -3.0696892738342285, -2.9426076412200928, -2.815525770187378, -2.688443899154663, -2.5613622665405273, -2.4342803955078125, -2.3071985244750977, -2.180116891860962, -2.053035020828247, -1.9259532690048218, -1.7988715171813965, -1.6717896461486816, -1.5447078943252563, -1.417626142501831, -1.2905442714691162, -1.163462519645691, -1.0363807678222656, -0.9092988967895508, -0.7822171449661255, -0.6551353335380554, -0.5280535221099854, -0.40097177028656006, -0.27388995885849, -0.14680814743041992, -0.019726350903511047, 0.10735544562339783, 0.2344372272491455, 0.3615190386772156, 0.48860085010528564, 0.6156826019287109, 0.742764413356781, 0.8698462247848511, 0.9969280362129211, 1.1240098476409912, 1.2510915994644165, 1.3781733512878418, 1.5052552223205566, 1.632336974143982, 1.7594187259674072, 1.886500597000122, 2.013582468032837, 2.1406641006469727, 2.2677459716796875, 2.3948278427124023, 2.521909713745117, 2.648991346359253, 2.7760732173919678, 2.9031548500061035, 3.0302367210388184, 3.157318353652954, 3.284400224685669, 3.411482095718384, 3.5385637283325195, 3.6656455993652344, 3.792727470397949, 3.919809341430664]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 11.0, 15.0, 26.0, 51.0, 67.0, 101.0, 156.0, 322.0, 515.0, 987.0, 2133.0, 4654.0, 11486.0, 30369.0, 84769.0, 211614.0, 327194.0, 225498.0, 93197.0, 33448.0, 12276.0, 5011.0, 2183.0, 1085.0, 554.0, 294.0, 208.0, 128.0, 58.0, 44.0, 31.0, 17.0, 14.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.236572265625, -1.19970703125, -1.162841796875, -1.1259765625, -1.089111328125, -1.05224609375, -1.015380859375, -0.978515625, -0.941650390625, -0.90478515625, -0.867919921875, -0.8310546875, -0.794189453125, -0.75732421875, -0.720458984375, -0.68359375, -0.646728515625, -0.60986328125, -0.572998046875, -0.5361328125, -0.499267578125, -0.46240234375, -0.425537109375, -0.388671875, -0.351806640625, -0.31494140625, -0.278076171875, -0.2412109375, -0.204345703125, -0.16748046875, -0.130615234375, -0.09375, -0.056884765625, -0.02001953125, 0.016845703125, 0.0537109375, 0.090576171875, 0.12744140625, 0.164306640625, 0.201171875, 0.238037109375, 0.27490234375, 0.311767578125, 0.3486328125, 0.385498046875, 0.42236328125, 0.459228515625, 0.49609375, 0.532958984375, 0.56982421875, 0.606689453125, 0.6435546875, 0.680419921875, 0.71728515625, 0.754150390625, 0.791015625, 0.827880859375, 0.86474609375, 0.901611328125, 0.9384765625, 0.975341796875, 1.01220703125, 1.049072265625, 1.0859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 5.0, 17.0, 19.0, 31.0, 19.0, 34.0, 35.0, 41.0, 49.0, 50.0, 56.0, 46.0, 52.0, 57.0, 48.0, 54.0, 41.0, 46.0, 47.0, 28.0, 30.0, 32.0, 33.0, 31.0, 23.0, 9.0, 6.0, 5.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.48828125, -3.36920166015625, -3.2501220703125, -3.13104248046875, -3.011962890625, -2.89288330078125, -2.7738037109375, -2.65472412109375, -2.53564453125, -2.41656494140625, -2.2974853515625, -2.17840576171875, -2.059326171875, -1.94024658203125, -1.8211669921875, -1.70208740234375, -1.5830078125, -1.46392822265625, -1.3448486328125, -1.22576904296875, -1.106689453125, -0.98760986328125, -0.8685302734375, -0.74945068359375, -0.63037109375, -0.51129150390625, -0.3922119140625, -0.27313232421875, -0.154052734375, -0.03497314453125, 0.0841064453125, 0.20318603515625, 0.322265625, 0.44134521484375, 0.5604248046875, 0.67950439453125, 0.798583984375, 0.91766357421875, 1.0367431640625, 1.15582275390625, 1.27490234375, 1.39398193359375, 1.5130615234375, 1.63214111328125, 1.751220703125, 1.87030029296875, 1.9893798828125, 2.10845947265625, 2.2275390625, 2.34661865234375, 2.4656982421875, 2.58477783203125, 2.703857421875, 2.82293701171875, 2.9420166015625, 3.06109619140625, 3.18017578125, 3.29925537109375, 3.4183349609375, 3.53741455078125, 3.656494140625, 3.77557373046875, 3.8946533203125, 4.01373291015625, 4.1328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 8.0, 6.0, 3.0, 19.0, 19.0, 42.0, 61.0, 101.0, 180.0, 251.0, 373.0, 717.0, 1229.0, 2344.0, 4573.0, 8816.0, 18243.0, 37369.0, 75220.0, 138485.0, 209258.0, 220547.0, 156528.0, 87709.0, 43818.0, 21162.0, 10191.0, 5267.0, 2624.0, 1500.0, 787.0, 414.0, 254.0, 167.0, 85.0, 60.0, 44.0, 25.0, 16.0, 16.0, 10.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5859375, -0.5682449340820312, -0.5505523681640625, -0.5328598022460938, -0.515167236328125, -0.49747467041015625, -0.4797821044921875, -0.46208953857421875, -0.44439697265625, -0.42670440673828125, -0.4090118408203125, -0.39131927490234375, -0.373626708984375, -0.35593414306640625, -0.3382415771484375, -0.32054901123046875, -0.3028564453125, -0.28516387939453125, -0.2674713134765625, -0.24977874755859375, -0.232086181640625, -0.21439361572265625, -0.1967010498046875, -0.17900848388671875, -0.16131591796875, -0.14362335205078125, -0.1259307861328125, -0.10823822021484375, -0.090545654296875, -0.07285308837890625, -0.0551605224609375, -0.03746795654296875, -0.019775390625, -0.00208282470703125, 0.0156097412109375, 0.03330230712890625, 0.050994873046875, 0.06868743896484375, 0.0863800048828125, 0.10407257080078125, 0.12176513671875, 0.13945770263671875, 0.1571502685546875, 0.17484283447265625, 0.192535400390625, 0.21022796630859375, 0.2279205322265625, 0.24561309814453125, 0.2633056640625, 0.28099822998046875, 0.2986907958984375, 0.31638336181640625, 0.334075927734375, 0.35176849365234375, 0.3694610595703125, 0.38715362548828125, 0.40484619140625, 0.42253875732421875, 0.4402313232421875, 0.45792388916015625, 0.475616455078125, 0.49330902099609375, 0.5110015869140625, 0.5286941528320312, 0.54638671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 6.0, 7.0, 7.0, 19.0, 13.0, 17.0, 22.0, 25.0, 26.0, 35.0, 32.0, 39.0, 39.0, 34.0, 46.0, 45.0, 53.0, 47.0, 47.0, 43.0, 50.0, 44.0, 36.0, 48.0, 27.0, 31.0, 21.0, 28.0, 29.0, 19.0, 14.0, 8.0, 10.0, 8.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.23828125, -6.03662109375, -5.8349609375, -5.63330078125, -5.431640625, -5.22998046875, -5.0283203125, -4.82666015625, -4.625, -4.42333984375, -4.2216796875, -4.02001953125, -3.818359375, -3.61669921875, -3.4150390625, -3.21337890625, -3.01171875, -2.81005859375, -2.6083984375, -2.40673828125, -2.205078125, -2.00341796875, -1.8017578125, -1.60009765625, -1.3984375, -1.19677734375, -0.9951171875, -0.79345703125, -0.591796875, -0.39013671875, -0.1884765625, 0.01318359375, 0.21484375, 0.41650390625, 0.6181640625, 0.81982421875, 1.021484375, 1.22314453125, 1.4248046875, 1.62646484375, 1.828125, 2.02978515625, 2.2314453125, 2.43310546875, 2.634765625, 2.83642578125, 3.0380859375, 3.23974609375, 3.44140625, 3.64306640625, 3.8447265625, 4.04638671875, 4.248046875, 4.44970703125, 4.6513671875, 4.85302734375, 5.0546875, 5.25634765625, 5.4580078125, 5.65966796875, 5.861328125, 6.06298828125, 6.2646484375, 6.46630859375, 6.66796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 5.0, 9.0, 13.0, 18.0, 30.0, 53.0, 92.0, 152.0, 257.0, 442.0, 776.0, 1500.0, 3213.0, 7931.0, 23571.0, 92976.0, 410322.0, 386160.0, 85067.0, 22104.0, 7520.0, 2992.0, 1526.0, 740.0, 448.0, 257.0, 136.0, 86.0, 46.0, 40.0, 27.0, 13.0, 11.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18700027465820312, -0.18149566650390625, -0.17599105834960938, -0.1704864501953125, -0.16498184204101562, -0.15947723388671875, -0.15397262573242188, -0.148468017578125, -0.14296340942382812, -0.13745880126953125, -0.13195419311523438, -0.1264495849609375, -0.12094497680664062, -0.11544036865234375, -0.10993576049804688, -0.10443115234375, -0.09892654418945312, -0.09342193603515625, -0.08791732788085938, -0.0824127197265625, -0.07690811157226562, -0.07140350341796875, -0.06589889526367188, -0.060394287109375, -0.054889678955078125, -0.04938507080078125, -0.043880462646484375, -0.0383758544921875, -0.032871246337890625, -0.02736663818359375, -0.021862030029296875, -0.016357421875, -0.010852813720703125, -0.00534820556640625, 0.000156402587890625, 0.0056610107421875, 0.011165618896484375, 0.01667022705078125, 0.022174835205078125, 0.027679443359375, 0.033184051513671875, 0.03868865966796875, 0.044193267822265625, 0.0496978759765625, 0.055202484130859375, 0.06070709228515625, 0.06621170043945312, 0.07171630859375, 0.07722091674804688, 0.08272552490234375, 0.08823013305664062, 0.0937347412109375, 0.09923934936523438, 0.10474395751953125, 0.11024856567382812, 0.115753173828125, 0.12125778198242188, 0.12676239013671875, 0.13226699829101562, 0.1377716064453125, 0.14327621459960938, 0.14878082275390625, 0.15428543090820312, 0.1597900390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 3.0, 8.0, 7.0, 7.0, 14.0, 8.0, 16.0, 20.0, 32.0, 36.0, 46.0, 64.0, 65.0, 77.0, 77.0, 82.0, 78.0, 67.0, 51.0, 51.0, 34.0, 38.0, 22.0, 11.0, 11.0, 22.0, 7.0, 9.0, 3.0, 10.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.34600830078125e-05, -9.043421596288681e-05, -8.740834891796112e-05, -8.438248187303543e-05, -8.135661482810974e-05, -7.833074778318405e-05, -7.530488073825836e-05, -7.227901369333267e-05, -6.925314664840698e-05, -6.622727960348129e-05, -6.32014125585556e-05, -6.017554551362991e-05, -5.7149678468704224e-05, -5.4123811423778534e-05, -5.1097944378852844e-05, -4.8072077333927155e-05, -4.5046210289001465e-05, -4.2020343244075775e-05, -3.8994476199150085e-05, -3.5968609154224396e-05, -3.2942742109298706e-05, -2.9916875064373016e-05, -2.6891008019447327e-05, -2.3865140974521637e-05, -2.0839273929595947e-05, -1.7813406884670258e-05, -1.4787539839744568e-05, -1.1761672794818878e-05, -8.735805749893188e-06, -5.709938704967499e-06, -2.684071660041809e-06, 3.417953848838806e-07, 3.3676624298095703e-06, 6.39352947473526e-06, 9.41939651966095e-06, 1.244526356458664e-05, 1.547113060951233e-05, 1.849699765443802e-05, 2.152286469936371e-05, 2.4548731744289398e-05, 2.7574598789215088e-05, 3.060046583414078e-05, 3.362633287906647e-05, 3.665219992399216e-05, 3.967806696891785e-05, 4.2703934013843536e-05, 4.5729801058769226e-05, 4.8755668103694916e-05, 5.1781535148620605e-05, 5.4807402193546295e-05, 5.7833269238471985e-05, 6.0859136283397675e-05, 6.388500332832336e-05, 6.691087037324905e-05, 6.993673741817474e-05, 7.296260446310043e-05, 7.598847150802612e-05, 7.901433855295181e-05, 8.20402055978775e-05, 8.506607264280319e-05, 8.809193968772888e-05, 9.111780673265457e-05, 9.414367377758026e-05, 9.716954082250595e-05, 0.00010019540786743164]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 9.0, 8.0, 9.0, 6.0, 7.0, 10.0, 11.0, 12.0, 11.0, 17.0, 31.0, 31.0, 47.0, 60.0, 99.0, 158.0, 294.0, 4471.0, 873077.0, 168055.0, 1404.0, 241.0, 144.0, 84.0, 48.0, 44.0, 23.0, 26.0, 21.0, 18.0, 10.0, 7.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94580078125, -0.9151382446289062, -0.8844757080078125, -0.8538131713867188, -0.823150634765625, -0.7924880981445312, -0.7618255615234375, -0.7311630249023438, -0.70050048828125, -0.6698379516601562, -0.6391754150390625, -0.6085128784179688, -0.577850341796875, -0.5471878051757812, -0.5165252685546875, -0.48586273193359375, -0.4552001953125, -0.42453765869140625, -0.3938751220703125, -0.36321258544921875, -0.332550048828125, -0.30188751220703125, -0.2712249755859375, -0.24056243896484375, -0.20989990234375, -0.17923736572265625, -0.1485748291015625, -0.11791229248046875, -0.087249755859375, -0.05658721923828125, -0.0259246826171875, 0.00473785400390625, 0.035400390625, 0.06606292724609375, 0.0967254638671875, 0.12738800048828125, 0.158050537109375, 0.18871307373046875, 0.2193756103515625, 0.25003814697265625, 0.28070068359375, 0.31136322021484375, 0.3420257568359375, 0.37268829345703125, 0.403350830078125, 0.43401336669921875, 0.4646759033203125, 0.49533843994140625, 0.5260009765625, 0.5566635131835938, 0.5873260498046875, 0.6179885864257812, 0.648651123046875, 0.6793136596679688, 0.7099761962890625, 0.7406387329101562, 0.77130126953125, 0.8019638061523438, 0.8326263427734375, 0.8632888793945312, 0.893951416015625, 0.9246139526367188, 0.9552764892578125, 0.9859390258789062, 1.0166015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 15.0, 19.0, 18.0, 19.0, 32.0, 36.0, 43.0, 57.0, 67.0, 95.0, 82.0, 68.0, 74.0, 57.0, 42.0, 28.0, 25.0, 25.0, 15.0, 22.0, 19.0, 13.0, 10.0, 9.0, 7.0, 5.0, 5.0, 6.0, 7.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.07611083984375, -0.07376575469970703, -0.07142066955566406, -0.0690755844116211, -0.06673049926757812, -0.06438541412353516, -0.06204032897949219, -0.05969524383544922, -0.05735015869140625, -0.05500507354736328, -0.05265998840332031, -0.050314903259277344, -0.047969818115234375, -0.045624732971191406, -0.04327964782714844, -0.04093456268310547, -0.0385894775390625, -0.03624439239501953, -0.03389930725097656, -0.031554222106933594, -0.029209136962890625, -0.026864051818847656, -0.024518966674804688, -0.02217388153076172, -0.01982879638671875, -0.01748371124267578, -0.015138626098632812, -0.012793540954589844, -0.010448455810546875, -0.008103370666503906, -0.0057582855224609375, -0.0034132003784179688, -0.001068115234375, 0.0012769699096679688, 0.0036220550537109375, 0.005967140197753906, 0.008312225341796875, 0.010657310485839844, 0.013002395629882812, 0.015347480773925781, 0.01769256591796875, 0.02003765106201172, 0.022382736206054688, 0.024727821350097656, 0.027072906494140625, 0.029417991638183594, 0.03176307678222656, 0.03410816192626953, 0.0364532470703125, 0.03879833221435547, 0.04114341735839844, 0.043488502502441406, 0.045833587646484375, 0.048178672790527344, 0.05052375793457031, 0.05286884307861328, 0.05521392822265625, 0.05755901336669922, 0.05990409851074219, 0.062249183654785156, 0.06459426879882812, 0.0669393539428711, 0.06928443908691406, 0.07162952423095703, 0.073974609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 8.0, 19.0, 42.0, 91.0, 196.0, 249.0, 193.0, 96.0, 74.0, 24.0, 12.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.921342849731445, -11.595335960388184, -11.269329071044922, -10.943321228027344, -10.617314338684082, -10.29130744934082, -9.965299606323242, -9.63929271697998, -9.313285827636719, -8.987278938293457, -8.661272048950195, -8.335264205932617, -8.009257316589355, -7.683250427246094, -7.357243061065674, -7.031235694885254, -6.705228805541992, -6.3792219161987305, -6.0532145500183105, -5.727207183837891, -5.401200294494629, -5.075193405151367, -4.749186038970947, -4.423178672790527, -4.097171783447266, -3.771164655685425, -3.445157527923584, -3.119150400161743, -2.7931432723999023, -2.4671361446380615, -2.1411290168762207, -1.8151218891143799, -1.489114761352539, -1.1631076335906982, -0.8371005058288574, -0.5110933780670166, -0.18508625030517578, 0.14092087745666504, 0.46692800521850586, 0.7929351329803467, 1.1189422607421875, 1.4449493885040283, 1.7709565162658691, 2.09696364402771, 2.422970771789551, 2.7489778995513916, 3.0749850273132324, 3.4009921550750732, 3.726999282836914, 4.053006172180176, 4.379013538360596, 4.705020904541016, 5.031027793884277, 5.357034683227539, 5.683042049407959, 6.009049415588379, 6.335056304931641, 6.661063194274902, 6.987070560455322, 7.313077926635742, 7.639084815979004, 7.965091705322266, 8.291099548339844, 8.617106437683105, 8.943113327026367]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 10.0, 6.0, 11.0, 11.0, 20.0, 14.0, 13.0, 26.0, 30.0, 36.0, 38.0, 36.0, 39.0, 48.0, 53.0, 53.0, 42.0, 44.0, 49.0, 49.0, 31.0, 49.0, 34.0, 34.0, 43.0, 26.0, 25.0, 18.0, 23.0, 19.0, 9.0, 11.0, 6.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1133792400360107, -3.0101258754730225, -2.9068727493286133, -2.803619384765625, -2.7003660202026367, -2.5971126556396484, -2.49385929107666, -2.390606164932251, -2.2873528003692627, -2.1840994358062744, -2.0808463096618652, -1.977592945098877, -1.8743395805358887, -1.7710862159729004, -1.6678329706192017, -1.564579725265503, -1.4613263607025146, -1.3580729961395264, -1.2548197507858276, -1.151566505432129, -1.0483131408691406, -0.9450598359107971, -0.8418065309524536, -0.7385532259941101, -0.6352999210357666, -0.5320466160774231, -0.4287933111190796, -0.3255400061607361, -0.22228670120239258, -0.11903339624404907, -0.015780091285705566, 0.08747321367263794, 0.19072651863098145, 0.29397982358932495, 0.39723312854766846, 0.500486433506012, 0.6037397384643555, 0.706993043422699, 0.8102463483810425, 0.913499653339386, 1.0167529582977295, 1.1200063228607178, 1.2232595682144165, 1.3265128135681152, 1.4297661781311035, 1.5330195426940918, 1.6362727880477905, 1.7395260334014893, 1.8427793979644775, 1.9460327625274658, 2.049285888671875, 2.1525392532348633, 2.2557926177978516, 2.35904598236084, 2.462299346923828, 2.5655524730682373, 2.6688058376312256, 2.772059202194214, 2.875312328338623, 2.9785656929016113, 3.0818190574645996, 3.185072422027588, 3.288325786590576, 3.3915789127349854, 3.4948322772979736]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 12.0, 13.0, 25.0, 21.0, 31.0, 56.0, 79.0, 123.0, 234.0, 394.0, 847.0, 1808.0, 4558.0, 15265.0, 97025.0, 707040.0, 187788.0, 22668.0, 6069.0, 2243.0, 1023.0, 525.0, 233.0, 142.0, 107.0, 65.0, 47.0, 27.0, 14.0, 13.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.840850830078125, -2.74810791015625, -2.655364990234375, -2.5626220703125, -2.469879150390625, -2.37713623046875, -2.284393310546875, -2.191650390625, -2.098907470703125, -2.00616455078125, -1.913421630859375, -1.8206787109375, -1.727935791015625, -1.63519287109375, -1.542449951171875, -1.44970703125, -1.356964111328125, -1.26422119140625, -1.171478271484375, -1.0787353515625, -0.985992431640625, -0.89324951171875, -0.800506591796875, -0.707763671875, -0.615020751953125, -0.52227783203125, -0.429534912109375, -0.3367919921875, -0.244049072265625, -0.15130615234375, -0.058563232421875, 0.0341796875, 0.126922607421875, 0.21966552734375, 0.312408447265625, 0.4051513671875, 0.497894287109375, 0.59063720703125, 0.683380126953125, 0.776123046875, 0.868865966796875, 0.96160888671875, 1.054351806640625, 1.1470947265625, 1.239837646484375, 1.33258056640625, 1.425323486328125, 1.51806640625, 1.610809326171875, 1.70355224609375, 1.796295166015625, 1.8890380859375, 1.981781005859375, 2.07452392578125, 2.167266845703125, 2.260009765625, 2.352752685546875, 2.44549560546875, 2.538238525390625, 2.6309814453125, 2.723724365234375, 2.81646728515625, 2.909210205078125, 3.001953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 4.0, 11.0, 10.0, 13.0, 13.0, 21.0, 17.0, 27.0, 22.0, 29.0, 27.0, 23.0, 35.0, 30.0, 45.0, 46.0, 44.0, 48.0, 36.0, 35.0, 46.0, 41.0, 42.0, 46.0, 43.0, 25.0, 28.0, 28.0, 26.0, 27.0, 20.0, 14.0, 14.0, 12.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.31494140625, -5.1416015625, -4.96826171875, -4.794921875, -4.62158203125, -4.4482421875, -4.27490234375, -4.1015625, -3.92822265625, -3.7548828125, -3.58154296875, -3.408203125, -3.23486328125, -3.0615234375, -2.88818359375, -2.71484375, -2.54150390625, -2.3681640625, -2.19482421875, -2.021484375, -1.84814453125, -1.6748046875, -1.50146484375, -1.328125, -1.15478515625, -0.9814453125, -0.80810546875, -0.634765625, -0.46142578125, -0.2880859375, -0.11474609375, 0.05859375, 0.23193359375, 0.4052734375, 0.57861328125, 0.751953125, 0.92529296875, 1.0986328125, 1.27197265625, 1.4453125, 1.61865234375, 1.7919921875, 1.96533203125, 2.138671875, 2.31201171875, 2.4853515625, 2.65869140625, 2.83203125, 3.00537109375, 3.1787109375, 3.35205078125, 3.525390625, 3.69873046875, 3.8720703125, 4.04541015625, 4.21875, 4.39208984375, 4.5654296875, 4.73876953125, 4.912109375, 5.08544921875, 5.2587890625, 5.43212890625, 5.60546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 9.0, 7.0, 21.0, 23.0, 63.0, 139.0, 523.0, 7468.0, 1034318.0, 5264.0, 424.0, 133.0, 61.0, 30.0, 16.0, 13.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0078125, -13.4107666015625, -12.813720703125, -12.2166748046875, -11.61962890625, -11.0225830078125, -10.425537109375, -9.8284912109375, -9.2314453125, -8.6343994140625, -8.037353515625, -7.4403076171875, -6.84326171875, -6.2462158203125, -5.649169921875, -5.0521240234375, -4.455078125, -3.8580322265625, -3.260986328125, -2.6639404296875, -2.06689453125, -1.4698486328125, -0.872802734375, -0.2757568359375, 0.3212890625, 0.9183349609375, 1.515380859375, 2.1124267578125, 2.70947265625, 3.3065185546875, 3.903564453125, 4.5006103515625, 5.09765625, 5.6947021484375, 6.291748046875, 6.8887939453125, 7.48583984375, 8.0828857421875, 8.679931640625, 9.2769775390625, 9.8740234375, 10.4710693359375, 11.068115234375, 11.6651611328125, 12.26220703125, 12.8592529296875, 13.456298828125, 14.0533447265625, 14.650390625, 15.2474365234375, 15.844482421875, 16.4415283203125, 17.03857421875, 17.6356201171875, 18.232666015625, 18.8297119140625, 19.4267578125, 20.0238037109375, 20.620849609375, 21.2178955078125, 21.81494140625, 22.4119873046875, 23.009033203125, 23.6060791015625, 24.203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 10.0, 3.0, 7.0, 8.0, 12.0, 15.0, 24.0, 25.0, 25.0, 24.0, 29.0, 41.0, 34.0, 40.0, 40.0, 40.0, 45.0, 53.0, 54.0, 51.0, 39.0, 43.0, 35.0, 38.0, 41.0, 26.0, 26.0, 25.0, 25.0, 17.0, 24.0, 19.0, 9.0, 10.0, 10.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.72100830078125, -4.5474853515625, -4.37396240234375, -4.200439453125, -4.02691650390625, -3.8533935546875, -3.67987060546875, -3.50634765625, -3.33282470703125, -3.1593017578125, -2.98577880859375, -2.812255859375, -2.63873291015625, -2.4652099609375, -2.29168701171875, -2.1181640625, -1.94464111328125, -1.7711181640625, -1.59759521484375, -1.424072265625, -1.25054931640625, -1.0770263671875, -0.90350341796875, -0.72998046875, -0.55645751953125, -0.3829345703125, -0.20941162109375, -0.035888671875, 0.13763427734375, 0.3111572265625, 0.48468017578125, 0.658203125, 0.83172607421875, 1.0052490234375, 1.17877197265625, 1.352294921875, 1.52581787109375, 1.6993408203125, 1.87286376953125, 2.04638671875, 2.21990966796875, 2.3934326171875, 2.56695556640625, 2.740478515625, 2.91400146484375, 3.0875244140625, 3.26104736328125, 3.4345703125, 3.60809326171875, 3.7816162109375, 3.95513916015625, 4.128662109375, 4.30218505859375, 4.4757080078125, 4.64923095703125, 4.82275390625, 4.99627685546875, 5.1697998046875, 5.34332275390625, 5.516845703125, 5.69036865234375, 5.8638916015625, 6.03741455078125, 6.2109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 6.0, 13.0, 14.0, 51.0, 130.0, 1821.0, 1044201.0, 2087.0, 134.0, 48.0, 12.0, 11.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.59375, -51.38525390625, -50.1767578125, -48.96826171875, -47.759765625, -46.55126953125, -45.3427734375, -44.13427734375, -42.92578125, -41.71728515625, -40.5087890625, -39.30029296875, -38.091796875, -36.88330078125, -35.6748046875, -34.46630859375, -33.2578125, -32.04931640625, -30.8408203125, -29.63232421875, -28.423828125, -27.21533203125, -26.0068359375, -24.79833984375, -23.58984375, -22.38134765625, -21.1728515625, -19.96435546875, -18.755859375, -17.54736328125, -16.3388671875, -15.13037109375, -13.921875, -12.71337890625, -11.5048828125, -10.29638671875, -9.087890625, -7.87939453125, -6.6708984375, -5.46240234375, -4.25390625, -3.04541015625, -1.8369140625, -0.62841796875, 0.580078125, 1.78857421875, 2.9970703125, 4.20556640625, 5.4140625, 6.62255859375, 7.8310546875, 9.03955078125, 10.248046875, 11.45654296875, 12.6650390625, 13.87353515625, 15.08203125, 16.29052734375, 17.4990234375, 18.70751953125, 19.916015625, 21.12451171875, 22.3330078125, 23.54150390625, 24.75]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 30.0, 87.0, 374.0, 359.0, 85.0, 24.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0005326271057128906, -0.0005186013877391815, -0.0005045756697654724, -0.0004905499517917633, -0.0004765242338180542, -0.0004624985158443451, -0.000448472797870636, -0.0004344470798969269, -0.0004204213619232178, -0.00040639564394950867, -0.00039236992597579956, -0.00037834420800209045, -0.00036431849002838135, -0.00035029277205467224, -0.00033626705408096313, -0.00032224133610725403, -0.0003082156181335449, -0.0002941899001598358, -0.0002801641821861267, -0.0002661384642124176, -0.0002521127462387085, -0.0002380870282649994, -0.00022406131029129028, -0.00021003559231758118, -0.00019600987434387207, -0.00018198415637016296, -0.00016795843839645386, -0.00015393272042274475, -0.00013990700244903564, -0.00012588128447532654, -0.00011185556650161743, -9.782984852790833e-05, -8.380413055419922e-05, -6.977841258049011e-05, -5.5752694606781006e-05, -4.17269766330719e-05, -2.7701258659362793e-05, -1.3675540685653687e-05, 3.501772880554199e-07, 1.4375895261764526e-05, 2.8401613235473633e-05, 4.242733120918274e-05, 5.6453049182891846e-05, 7.047876715660095e-05, 8.450448513031006e-05, 9.853020310401917e-05, 0.00011255592107772827, 0.00012658163905143738, 0.00014060735702514648, 0.0001546330749988556, 0.0001686587929725647, 0.0001826845109462738, 0.0001967102289199829, 0.00021073594689369202, 0.00022476166486740112, 0.00023878738284111023, 0.00025281310081481934, 0.00026683881878852844, 0.00028086453676223755, 0.00029489025473594666, 0.00030891597270965576, 0.00032294169068336487, 0.000336967408657074, 0.0003509931266307831, 0.0003650188446044922]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 18.0, 26.0, 50.0, 79.0, 187.0, 553.0, 3899.0, 160926.0, 871772.0, 9569.0, 969.0, 208.0, 113.0, 41.0, 47.0, 18.0, 15.0, 8.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9140625, -2.8415069580078125, -2.768951416015625, -2.6963958740234375, -2.62384033203125, -2.5512847900390625, -2.478729248046875, -2.4061737060546875, -2.3336181640625, -2.2610626220703125, -2.188507080078125, -2.1159515380859375, -2.04339599609375, -1.9708404541015625, -1.898284912109375, -1.8257293701171875, -1.753173828125, -1.6806182861328125, -1.608062744140625, -1.5355072021484375, -1.46295166015625, -1.3903961181640625, -1.317840576171875, -1.2452850341796875, -1.1727294921875, -1.1001739501953125, -1.027618408203125, -0.9550628662109375, -0.88250732421875, -0.8099517822265625, -0.737396240234375, -0.6648406982421875, -0.59228515625, -0.5197296142578125, -0.447174072265625, -0.3746185302734375, -0.30206298828125, -0.2295074462890625, -0.156951904296875, -0.0843963623046875, -0.0118408203125, 0.0607147216796875, 0.133270263671875, 0.2058258056640625, 0.27838134765625, 0.3509368896484375, 0.423492431640625, 0.4960479736328125, 0.568603515625, 0.6411590576171875, 0.713714599609375, 0.7862701416015625, 0.85882568359375, 0.9313812255859375, 1.003936767578125, 1.0764923095703125, 1.1490478515625, 1.2216033935546875, 1.294158935546875, 1.3667144775390625, 1.43927001953125, 1.5118255615234375, 1.584381103515625, 1.6569366455078125, 1.7294921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 7.0, 14.0, 24.0, 39.0, 52.0, 86.0, 101.0, 165.0, 156.0, 102.0, 71.0, 52.0, 29.0, 28.0, 15.0, 9.0, 7.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4591102600097656, -0.44727325439453125, -0.4354362487792969, -0.4235992431640625, -0.4117622375488281, -0.39992523193359375, -0.3880882263183594, -0.376251220703125, -0.3644142150878906, -0.35257720947265625, -0.3407402038574219, -0.3289031982421875, -0.3170661926269531, -0.30522918701171875, -0.2933921813964844, -0.28155517578125, -0.2697181701660156, -0.25788116455078125, -0.24604415893554688, -0.2342071533203125, -0.22237014770507812, -0.21053314208984375, -0.19869613647460938, -0.186859130859375, -0.17502212524414062, -0.16318511962890625, -0.15134811401367188, -0.1395111083984375, -0.12767410278320312, -0.11583709716796875, -0.10400009155273438, -0.0921630859375, -0.08032608032226562, -0.06848907470703125, -0.056652069091796875, -0.0448150634765625, -0.032978057861328125, -0.02114105224609375, -0.009304046630859375, 0.002532958984375, 0.014369964599609375, 0.02620697021484375, 0.038043975830078125, 0.0498809814453125, 0.061717987060546875, 0.07355499267578125, 0.08539199829101562, 0.09722900390625, 0.10906600952148438, 0.12090301513671875, 0.13274002075195312, 0.1445770263671875, 0.15641403198242188, 0.16825103759765625, 0.18008804321289062, 0.191925048828125, 0.20376205444335938, 0.21559906005859375, 0.22743606567382812, 0.2392730712890625, 0.2511100769042969, 0.26294708251953125, 0.2747840881347656, 0.28662109375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 22.0, 962.0, 37.0], "bins": [-257.7974853515625, -253.67599487304688, -249.5544891357422, -245.43299865722656, -241.31150817871094, -237.19000244140625, -233.06851196289062, -228.947021484375, -224.82553100585938, -220.70404052734375, -216.58253479003906, -212.46104431152344, -208.3395538330078, -204.21804809570312, -200.0965576171875, -195.97506713867188, -191.8535614013672, -187.73207092285156, -183.61056518554688, -179.48907470703125, -175.36758422851562, -171.24609375, -167.1245880126953, -163.0030975341797, -158.881591796875, -154.76010131835938, -150.6385955810547, -146.51710510253906, -142.39561462402344, -138.27410888671875, -134.15261840820312, -130.0311279296875, -125.90962982177734, -121.78813171386719, -117.66664123535156, -113.5451431274414, -109.42364501953125, -105.30215454101562, -101.18065643310547, -97.05915832519531, -92.93766784667969, -88.81616973876953, -84.6946792602539, -80.57318115234375, -76.45169067382812, -72.33019256591797, -68.20869445800781, -64.08720397949219, -59.96570587158203, -55.84421157836914, -51.72271728515625, -47.601219177246094, -43.4797248840332, -39.35823059082031, -35.236732482910156, -31.115238189697266, -26.993743896484375, -22.872249603271484, -18.75075340270996, -14.629258155822754, -10.507762908935547, -6.386268615722656, -2.264772415161133, 1.8567237854003906, 5.978218078613281]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 1.0, 7.0, 9.0, 10.0, 15.0, 11.0, 16.0, 15.0, 24.0, 17.0, 23.0, 28.0, 27.0, 35.0, 36.0, 35.0, 29.0, 32.0, 35.0, 39.0, 41.0, 36.0, 45.0, 44.0, 34.0, 37.0, 33.0, 30.0, 31.0, 30.0, 27.0, 26.0, 26.0, 18.0, 16.0, 9.0, 11.0, 13.0, 5.0, 6.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.181455612182617, -7.926083087921143, -7.670711040496826, -7.415338516235352, -7.159965991973877, -6.904593467712402, -6.649221420288086, -6.393848896026611, -6.138476371765137, -5.883103847503662, -5.627731800079346, -5.372359275817871, -5.1169867515563965, -4.861614227294922, -4.6062421798706055, -4.350869655609131, -4.0954976081848145, -3.840125322341919, -3.5847527980804443, -3.329380512237549, -3.074007987976074, -2.8186357021331787, -2.563263416290283, -2.3078908920288086, -2.052518606185913, -1.797146201133728, -1.541773796081543, -1.2864015102386475, -1.0310291051864624, -0.7756567001342773, -0.5202844142913818, -0.2649120092391968, -0.009539604187011719, 0.24583277106285095, 0.5012051463127136, 0.7565774917602539, 1.011949896812439, 1.267322301864624, 1.5226945877075195, 1.7780669927597046, 2.0334393978118896, 2.288811683654785, 2.5441842079162598, 2.7995564937591553, 3.054928779602051, 3.3103013038635254, 3.565673589706421, 3.8210458755493164, 4.076418399810791, 4.331790924072266, 4.587162971496582, 4.842535495758057, 5.097908020019531, 5.353280067443848, 5.608652591705322, 5.864025115966797, 6.119397163391113, 6.374769687652588, 6.630141735076904, 6.885514259338379, 7.1408867835998535, 7.396259307861328, 7.6516313552856445, 7.907003879547119, 8.162376403808594]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 9.0, 5.0, 4.0, 10.0, 12.0, 14.0, 20.0, 23.0, 24.0, 25.0, 44.0, 78.0, 91.0, 135.0, 188.0, 333.0, 628.0, 1301.0, 3654.0, 11888.0, 58063.0, 401291.0, 1981412.0, 1450947.0, 233486.0, 36864.0, 8664.0, 2704.0, 1098.0, 486.0, 293.0, 178.0, 88.0, 60.0, 39.0, 23.0, 26.0, 12.0, 16.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0], "bins": [-5.0, -4.84783935546875, -4.6956787109375, -4.54351806640625, -4.391357421875, -4.23919677734375, -4.0870361328125, -3.93487548828125, -3.78271484375, -3.63055419921875, -3.4783935546875, -3.32623291015625, -3.174072265625, -3.02191162109375, -2.8697509765625, -2.71759033203125, -2.5654296875, -2.41326904296875, -2.2611083984375, -2.10894775390625, -1.956787109375, -1.80462646484375, -1.6524658203125, -1.50030517578125, -1.34814453125, -1.19598388671875, -1.0438232421875, -0.89166259765625, -0.739501953125, -0.58734130859375, -0.4351806640625, -0.28302001953125, -0.130859375, 0.02130126953125, 0.1734619140625, 0.32562255859375, 0.477783203125, 0.62994384765625, 0.7821044921875, 0.93426513671875, 1.08642578125, 1.23858642578125, 1.3907470703125, 1.54290771484375, 1.695068359375, 1.84722900390625, 1.9993896484375, 2.15155029296875, 2.3037109375, 2.45587158203125, 2.6080322265625, 2.76019287109375, 2.912353515625, 3.06451416015625, 3.2166748046875, 3.36883544921875, 3.52099609375, 3.67315673828125, 3.8253173828125, 3.97747802734375, 4.129638671875, 4.28179931640625, 4.4339599609375, 4.58612060546875, 4.73828125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 9.0, 11.0, 11.0, 9.0, 8.0, 23.0, 25.0, 23.0, 24.0, 43.0, 38.0, 48.0, 43.0, 51.0, 61.0, 56.0, 50.0, 64.0, 60.0, 36.0, 54.0, 48.0, 31.0, 26.0, 30.0, 24.0, 26.0, 14.0, 11.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.4078369140625, -3.302001953125, -3.1961669921875, -3.09033203125, -2.9844970703125, -2.878662109375, -2.7728271484375, -2.6669921875, -2.5611572265625, -2.455322265625, -2.3494873046875, -2.24365234375, -2.1378173828125, -2.031982421875, -1.9261474609375, -1.8203125, -1.7144775390625, -1.608642578125, -1.5028076171875, -1.39697265625, -1.2911376953125, -1.185302734375, -1.0794677734375, -0.9736328125, -0.8677978515625, -0.761962890625, -0.6561279296875, -0.55029296875, -0.4444580078125, -0.338623046875, -0.2327880859375, -0.126953125, -0.0211181640625, 0.084716796875, 0.1905517578125, 0.29638671875, 0.4022216796875, 0.508056640625, 0.6138916015625, 0.7197265625, 0.8255615234375, 0.931396484375, 1.0372314453125, 1.14306640625, 1.2489013671875, 1.354736328125, 1.4605712890625, 1.56640625, 1.6722412109375, 1.778076171875, 1.8839111328125, 1.98974609375, 2.0955810546875, 2.201416015625, 2.3072509765625, 2.4130859375, 2.5189208984375, 2.624755859375, 2.7305908203125, 2.83642578125, 2.9422607421875, 3.048095703125, 3.1539306640625, 3.259765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 11.0, 13.0, 47.0, 130.0, 856.0, 4088763.0, 103864.0, 438.0, 85.0, 31.0, 13.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -15.166015625, -13.76953125, -12.373046875, -10.9765625, -9.580078125, -8.18359375, -6.787109375, -5.390625, -3.994140625, -2.59765625, -1.201171875, 0.1953125, 1.591796875, 2.98828125, 4.384765625, 5.78125, 7.177734375, 8.57421875, 9.970703125, 11.3671875, 12.763671875, 14.16015625, 15.556640625, 16.953125, 18.349609375, 19.74609375, 21.142578125, 22.5390625, 23.935546875, 25.33203125, 26.728515625, 28.125, 29.521484375, 30.91796875, 32.314453125, 33.7109375, 35.107421875, 36.50390625, 37.900390625, 39.296875, 40.693359375, 42.08984375, 43.486328125, 44.8828125, 46.279296875, 47.67578125, 49.072265625, 50.46875, 51.865234375, 53.26171875, 54.658203125, 56.0546875, 57.451171875, 58.84765625, 60.244140625, 61.640625, 63.037109375, 64.43359375, 65.830078125, 67.2265625, 68.623046875, 70.01953125, 71.416015625, 72.8125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 13.0, 15.0, 22.0, 29.0, 51.0, 45.0, 94.0, 138.0, 175.0, 271.0, 368.0, 535.0, 541.0, 508.0, 404.0, 250.0, 171.0, 119.0, 73.0, 59.0, 42.0, 26.0, 23.0, 21.0, 9.0, 10.0, 7.0, 3.0, 3.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5595703125, -1.5128326416015625, -1.466094970703125, -1.4193572998046875, -1.37261962890625, -1.3258819580078125, -1.279144287109375, -1.2324066162109375, -1.1856689453125, -1.1389312744140625, -1.092193603515625, -1.0454559326171875, -0.99871826171875, -0.9519805908203125, -0.905242919921875, -0.8585052490234375, -0.811767578125, -0.7650299072265625, -0.718292236328125, -0.6715545654296875, -0.62481689453125, -0.5780792236328125, -0.531341552734375, -0.4846038818359375, -0.4378662109375, -0.3911285400390625, -0.344390869140625, -0.2976531982421875, -0.25091552734375, -0.2041778564453125, -0.157440185546875, -0.1107025146484375, -0.06396484375, -0.0172271728515625, 0.029510498046875, 0.0762481689453125, 0.12298583984375, 0.1697235107421875, 0.216461181640625, 0.2631988525390625, 0.3099365234375, 0.3566741943359375, 0.403411865234375, 0.4501495361328125, 0.49688720703125, 0.5436248779296875, 0.590362548828125, 0.6371002197265625, 0.683837890625, 0.7305755615234375, 0.777313232421875, 0.8240509033203125, 0.87078857421875, 0.9175262451171875, 0.964263916015625, 1.0110015869140625, 1.0577392578125, 1.1044769287109375, 1.151214599609375, 1.1979522705078125, 1.24468994140625, 1.2914276123046875, 1.338165283203125, 1.3849029541015625, 1.431640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 29.0, 47.0, 114.0, 208.0, 266.0, 164.0, 103.0, 47.0, 17.0, 5.0, 2.0, 2.0], "bins": [-23.95665740966797, -23.531173706054688, -23.105688095092773, -22.680204391479492, -22.254718780517578, -21.829235076904297, -21.403751373291016, -20.9782657623291, -20.55278205871582, -20.12729835510254, -19.701812744140625, -19.276329040527344, -18.85084342956543, -18.42535972595215, -17.999874114990234, -17.574390411376953, -17.14890480041504, -16.723421096801758, -16.297935485839844, -15.872451782226562, -15.446967124938965, -15.021482467651367, -14.59599781036377, -14.170513153076172, -13.74502944946289, -13.319544792175293, -12.894060134887695, -12.468576431274414, -12.043091773986816, -11.617607116699219, -11.192122459411621, -10.766637802124023, -10.341154098510742, -9.915669441223145, -9.490184783935547, -9.064701080322266, -8.639216423034668, -8.21373176574707, -7.788247108459473, -7.362762451171875, -6.937277793884277, -6.51179313659668, -6.08630895614624, -5.660824298858643, -5.235339641571045, -4.8098554611206055, -4.384370803833008, -3.95888614654541, -3.5334014892578125, -3.107917070388794, -2.6824324131011963, -2.2569479942321777, -1.8314634561538696, -1.4059789180755615, -0.980494499206543, -0.5550098419189453, -0.12952542304992676, 0.29595908522605896, 0.7214435935020447, 1.146928071975708, 1.5724126100540161, 1.9978971481323242, 2.4233815670013428, 2.8488662242889404, 3.274350643157959]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 12.0, 11.0, 13.0, 10.0, 19.0, 22.0, 23.0, 29.0, 29.0, 35.0, 29.0, 31.0, 34.0, 38.0, 37.0, 53.0, 45.0, 36.0, 48.0, 45.0, 35.0, 39.0, 43.0, 41.0, 26.0, 33.0, 25.0, 38.0, 24.0, 22.0, 17.0, 16.0, 11.0, 9.0, 4.0, 8.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.8913259506225586, -3.787609100341797, -3.683892011642456, -3.5801749229431152, -3.4764580726623535, -3.372741222381592, -3.269024133682251, -3.16530704498291, -3.0615901947021484, -2.9578733444213867, -2.854156255722046, -2.750439167022705, -2.6467223167419434, -2.5430054664611816, -2.439288377761841, -2.3355712890625, -2.2318544387817383, -2.1281375885009766, -2.0244204998016357, -1.9207035303115845, -1.8169865608215332, -1.713269591331482, -1.6095526218414307, -1.5058356523513794, -1.4021186828613281, -1.2984017133712769, -1.1946847438812256, -1.0909677743911743, -0.987250804901123, -0.8835338354110718, -0.7798168659210205, -0.6760998964309692, -0.5723831653594971, -0.4686661958694458, -0.36494922637939453, -0.26123225688934326, -0.157515287399292, -0.05379831790924072, 0.04991865158081055, 0.15363562107086182, 0.2573525905609131, 0.36106956005096436, 0.4647865295410156, 0.5685034990310669, 0.6722204685211182, 0.7759374380111694, 0.8796544075012207, 0.983371376991272, 1.0870883464813232, 1.1908053159713745, 1.2945222854614258, 1.398239254951477, 1.5019562244415283, 1.6056731939315796, 1.7093901634216309, 1.8131071329116821, 1.9168241024017334, 2.020541191101074, 2.124258041381836, 2.2279748916625977, 2.3316919803619385, 2.4354090690612793, 2.539125919342041, 2.6428427696228027, 2.7465598583221436]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 2.0, 4.0, 12.0, 14.0, 25.0, 44.0, 59.0, 101.0, 161.0, 240.0, 352.0, 594.0, 902.0, 1493.0, 3124.0, 7498.0, 21355.0, 71775.0, 234250.0, 401246.0, 209934.0, 62625.0, 19195.0, 6772.0, 2895.0, 1510.0, 882.0, 537.0, 327.0, 231.0, 145.0, 82.0, 45.0, 34.0, 27.0, 17.0, 7.0, 10.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8017578125, -0.7735748291015625, -0.745391845703125, -0.7172088623046875, -0.68902587890625, -0.6608428955078125, -0.632659912109375, -0.6044769287109375, -0.5762939453125, -0.5481109619140625, -0.519927978515625, -0.4917449951171875, -0.46356201171875, -0.4353790283203125, -0.407196044921875, -0.3790130615234375, -0.350830078125, -0.3226470947265625, -0.294464111328125, -0.2662811279296875, -0.23809814453125, -0.2099151611328125, -0.181732177734375, -0.1535491943359375, -0.1253662109375, -0.0971832275390625, -0.069000244140625, -0.0408172607421875, -0.01263427734375, 0.0155487060546875, 0.043731689453125, 0.0719146728515625, 0.10009765625, 0.1282806396484375, 0.156463623046875, 0.1846466064453125, 0.21282958984375, 0.2410125732421875, 0.269195556640625, 0.2973785400390625, 0.3255615234375, 0.3537445068359375, 0.381927490234375, 0.4101104736328125, 0.43829345703125, 0.4664764404296875, 0.494659423828125, 0.5228424072265625, 0.551025390625, 0.5792083740234375, 0.607391357421875, 0.6355743408203125, 0.66375732421875, 0.6919403076171875, 0.720123291015625, 0.7483062744140625, 0.7764892578125, 0.8046722412109375, 0.832855224609375, 0.8610382080078125, 0.88922119140625, 0.9174041748046875, 0.945587158203125, 0.9737701416015625, 1.001953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 11.0, 9.0, 14.0, 21.0, 23.0, 18.0, 27.0, 14.0, 39.0, 46.0, 44.0, 35.0, 46.0, 58.0, 50.0, 55.0, 43.0, 34.0, 51.0, 39.0, 49.0, 49.0, 47.0, 34.0, 26.0, 27.0, 20.0, 22.0, 13.0, 15.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4453125, -3.354278564453125, -3.26324462890625, -3.172210693359375, -3.0811767578125, -2.990142822265625, -2.89910888671875, -2.808074951171875, -2.717041015625, -2.626007080078125, -2.53497314453125, -2.443939208984375, -2.3529052734375, -2.261871337890625, -2.17083740234375, -2.079803466796875, -1.98876953125, -1.897735595703125, -1.80670166015625, -1.715667724609375, -1.6246337890625, -1.533599853515625, -1.44256591796875, -1.351531982421875, -1.260498046875, -1.169464111328125, -1.07843017578125, -0.987396240234375, -0.8963623046875, -0.805328369140625, -0.71429443359375, -0.623260498046875, -0.5322265625, -0.441192626953125, -0.35015869140625, -0.259124755859375, -0.1680908203125, -0.077056884765625, 0.01397705078125, 0.105010986328125, 0.196044921875, 0.287078857421875, 0.37811279296875, 0.469146728515625, 0.5601806640625, 0.651214599609375, 0.74224853515625, 0.833282470703125, 0.92431640625, 1.015350341796875, 1.10638427734375, 1.197418212890625, 1.2884521484375, 1.379486083984375, 1.47052001953125, 1.561553955078125, 1.652587890625, 1.743621826171875, 1.83465576171875, 1.925689697265625, 2.0167236328125, 2.107757568359375, 2.19879150390625, 2.289825439453125, 2.380859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 12.0, 10.0, 13.0, 17.0, 32.0, 43.0, 49.0, 100.0, 149.0, 234.0, 311.0, 494.0, 776.0, 1235.0, 1977.0, 2971.0, 4955.0, 7897.0, 13002.0, 21132.0, 34311.0, 55827.0, 85476.0, 121940.0, 152894.0, 157373.0, 130364.0, 92786.0, 61833.0, 38348.0, 23740.0, 14352.0, 9006.0, 5482.0, 3401.0, 2095.0, 1391.0, 901.0, 567.0, 367.0, 235.0, 144.0, 96.0, 64.0, 48.0, 31.0, 27.0, 15.0, 8.0, 5.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.228759765625, -0.22062301635742188, -0.21248626708984375, -0.20434951782226562, -0.1962127685546875, -0.18807601928710938, -0.17993927001953125, -0.17180252075195312, -0.163665771484375, -0.15552902221679688, -0.14739227294921875, -0.13925552368164062, -0.1311187744140625, -0.12298202514648438, -0.11484527587890625, -0.10670852661132812, -0.09857177734375, -0.09043502807617188, -0.08229827880859375, -0.07416152954101562, -0.0660247802734375, -0.057888031005859375, -0.04975128173828125, -0.041614532470703125, -0.033477783203125, -0.025341033935546875, -0.01720428466796875, -0.009067535400390625, -0.0009307861328125, 0.007205963134765625, 0.01534271240234375, 0.023479461669921875, 0.0316162109375, 0.039752960205078125, 0.04788970947265625, 0.056026458740234375, 0.0641632080078125, 0.07229995727539062, 0.08043670654296875, 0.08857345581054688, 0.096710205078125, 0.10484695434570312, 0.11298370361328125, 0.12112045288085938, 0.1292572021484375, 0.13739395141601562, 0.14553070068359375, 0.15366744995117188, 0.16180419921875, 0.16994094848632812, 0.17807769775390625, 0.18621444702148438, 0.1943511962890625, 0.20248794555664062, 0.21062469482421875, 0.21876144409179688, 0.226898193359375, 0.23503494262695312, 0.24317169189453125, 0.2513084411621094, 0.2594451904296875, 0.2675819396972656, 0.27571868896484375, 0.2838554382324219, 0.2919921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 5.0, 3.0, 7.0, 10.0, 10.0, 9.0, 14.0, 11.0, 22.0, 24.0, 28.0, 34.0, 38.0, 46.0, 30.0, 41.0, 38.0, 39.0, 37.0, 33.0, 39.0, 46.0, 31.0, 39.0, 38.0, 38.0, 31.0, 36.0, 27.0, 36.0, 20.0, 18.0, 19.0, 20.0, 12.0, 13.0, 13.0, 9.0, 5.0, 7.0, 8.0, 3.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.1759033203125, -4.039306640625, -3.9027099609375, -3.76611328125, -3.6295166015625, -3.492919921875, -3.3563232421875, -3.2197265625, -3.0831298828125, -2.946533203125, -2.8099365234375, -2.67333984375, -2.5367431640625, -2.400146484375, -2.2635498046875, -2.126953125, -1.9903564453125, -1.853759765625, -1.7171630859375, -1.58056640625, -1.4439697265625, -1.307373046875, -1.1707763671875, -1.0341796875, -0.8975830078125, -0.760986328125, -0.6243896484375, -0.48779296875, -0.3511962890625, -0.214599609375, -0.0780029296875, 0.05859375, 0.1951904296875, 0.331787109375, 0.4683837890625, 0.60498046875, 0.7415771484375, 0.878173828125, 1.0147705078125, 1.1513671875, 1.2879638671875, 1.424560546875, 1.5611572265625, 1.69775390625, 1.8343505859375, 1.970947265625, 2.1075439453125, 2.244140625, 2.3807373046875, 2.517333984375, 2.6539306640625, 2.79052734375, 2.9271240234375, 3.063720703125, 3.2003173828125, 3.3369140625, 3.4735107421875, 3.610107421875, 3.7467041015625, 3.88330078125, 4.0198974609375, 4.156494140625, 4.2930908203125, 4.4296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 9.0, 8.0, 16.0, 18.0, 22.0, 28.0, 45.0, 77.0, 136.0, 194.0, 341.0, 694.0, 1530.0, 4026.0, 13241.0, 67639.0, 420819.0, 444546.0, 73665.0, 14122.0, 4087.0, 1585.0, 734.0, 359.0, 211.0, 109.0, 80.0, 62.0, 31.0, 23.0, 22.0, 13.0, 10.0, 19.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09649658203125, -0.09305286407470703, -0.08960914611816406, -0.0861654281616211, -0.08272171020507812, -0.07927799224853516, -0.07583427429199219, -0.07239055633544922, -0.06894683837890625, -0.06550312042236328, -0.06205940246582031, -0.058615684509277344, -0.055171966552734375, -0.051728248596191406, -0.04828453063964844, -0.04484081268310547, -0.0413970947265625, -0.03795337677001953, -0.03450965881347656, -0.031065940856933594, -0.027622222900390625, -0.024178504943847656, -0.020734786987304688, -0.01729106903076172, -0.01384735107421875, -0.010403633117675781, -0.0069599151611328125, -0.0035161972045898438, -7.2479248046875e-05, 0.0033712387084960938, 0.0068149566650390625, 0.010258674621582031, 0.013702392578125, 0.01714611053466797, 0.020589828491210938, 0.024033546447753906, 0.027477264404296875, 0.030920982360839844, 0.03436470031738281, 0.03780841827392578, 0.04125213623046875, 0.04469585418701172, 0.04813957214355469, 0.051583290100097656, 0.055027008056640625, 0.058470726013183594, 0.06191444396972656, 0.06535816192626953, 0.0688018798828125, 0.07224559783935547, 0.07568931579589844, 0.0791330337524414, 0.08257675170898438, 0.08602046966552734, 0.08946418762207031, 0.09290790557861328, 0.09635162353515625, 0.09979534149169922, 0.10323905944824219, 0.10668277740478516, 0.11012649536132812, 0.1135702133178711, 0.11701393127441406, 0.12045764923095703, 0.1239013671875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 12.0, 15.0, 26.0, 30.0, 51.0, 81.0, 120.0, 120.0, 137.0, 110.0, 79.0, 89.0, 36.0, 26.0, 26.0, 12.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010401010513305664, -0.0001013539731502533, -9.869784116744995e-05, -9.60417091846466e-05, -9.338557720184326e-05, -9.072944521903992e-05, -8.807331323623657e-05, -8.541718125343323e-05, -8.276104927062988e-05, -8.010491728782654e-05, -7.74487853050232e-05, -7.479265332221985e-05, -7.21365213394165e-05, -6.948038935661316e-05, -6.682425737380981e-05, -6.416812539100647e-05, -6.151199340820312e-05, -5.885586142539978e-05, -5.6199729442596436e-05, -5.354359745979309e-05, -5.0887465476989746e-05, -4.82313334941864e-05, -4.557520151138306e-05, -4.291906952857971e-05, -4.026293754577637e-05, -3.760680556297302e-05, -3.495067358016968e-05, -3.229454159736633e-05, -2.9638409614562988e-05, -2.6982277631759644e-05, -2.43261456489563e-05, -2.1670013666152954e-05, -1.901388168334961e-05, -1.6357749700546265e-05, -1.370161771774292e-05, -1.1045485734939575e-05, -8.38935375213623e-06, -5.733221769332886e-06, -3.077089786529541e-06, -4.209578037261963e-07, 2.2351741790771484e-06, 4.891306161880493e-06, 7.547438144683838e-06, 1.0203570127487183e-05, 1.2859702110290527e-05, 1.5515834093093872e-05, 1.8171966075897217e-05, 2.082809805870056e-05, 2.3484230041503906e-05, 2.614036202430725e-05, 2.8796494007110596e-05, 3.145262598991394e-05, 3.4108757972717285e-05, 3.676488995552063e-05, 3.9421021938323975e-05, 4.207715392112732e-05, 4.4733285903930664e-05, 4.738941788673401e-05, 5.0045549869537354e-05, 5.27016818523407e-05, 5.535781383514404e-05, 5.801394581794739e-05, 6.067007780075073e-05, 6.332620978355408e-05, 6.598234176635742e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 4.0, 18.0, 4.0, 7.0, 15.0, 37.0, 95.0, 306.0, 1336.0, 25212.0, 995064.0, 24425.0, 1493.0, 309.0, 100.0, 39.0, 21.0, 12.0, 18.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.337890625, -0.32350921630859375, -0.3091278076171875, -0.29474639892578125, -0.280364990234375, -0.26598358154296875, -0.2516021728515625, -0.23722076416015625, -0.22283935546875, -0.20845794677734375, -0.1940765380859375, -0.17969512939453125, -0.165313720703125, -0.15093231201171875, -0.1365509033203125, -0.12216949462890625, -0.1077880859375, -0.09340667724609375, -0.0790252685546875, -0.06464385986328125, -0.050262451171875, -0.03588104248046875, -0.0214996337890625, -0.00711822509765625, 0.00726318359375, 0.02164459228515625, 0.0360260009765625, 0.05040740966796875, 0.064788818359375, 0.07917022705078125, 0.0935516357421875, 0.10793304443359375, 0.122314453125, 0.13669586181640625, 0.1510772705078125, 0.16545867919921875, 0.179840087890625, 0.19422149658203125, 0.2086029052734375, 0.22298431396484375, 0.23736572265625, 0.25174713134765625, 0.2661285400390625, 0.28050994873046875, 0.294891357421875, 0.30927276611328125, 0.3236541748046875, 0.33803558349609375, 0.3524169921875, 0.36679840087890625, 0.3811798095703125, 0.39556121826171875, 0.409942626953125, 0.42432403564453125, 0.4387054443359375, 0.45308685302734375, 0.46746826171875, 0.48184967041015625, 0.4962310791015625, 0.5106124877929688, 0.524993896484375, 0.5393753051757812, 0.5537567138671875, 0.5681381225585938, 0.58251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 9.0, 10.0, 24.0, 46.0, 67.0, 104.0, 162.0, 179.0, 130.0, 95.0, 65.0, 49.0, 15.0, 10.0, 6.0, 5.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.07419109344482422, -0.07202720642089844, -0.06986331939697266, -0.06769943237304688, -0.0655355453491211, -0.06337165832519531, -0.06120777130126953, -0.05904388427734375, -0.05687999725341797, -0.05471611022949219, -0.052552223205566406, -0.050388336181640625, -0.048224449157714844, -0.04606056213378906, -0.04389667510986328, -0.0417327880859375, -0.03956890106201172, -0.03740501403808594, -0.035241127014160156, -0.033077239990234375, -0.030913352966308594, -0.028749465942382812, -0.02658557891845703, -0.02442169189453125, -0.02225780487060547, -0.020093917846679688, -0.017930030822753906, -0.015766143798828125, -0.013602256774902344, -0.011438369750976562, -0.009274482727050781, -0.007110595703125, -0.004946708679199219, -0.0027828216552734375, -0.0006189346313476562, 0.001544952392578125, 0.0037088394165039062, 0.0058727264404296875, 0.008036613464355469, 0.01020050048828125, 0.012364387512207031, 0.014528274536132812, 0.016692161560058594, 0.018856048583984375, 0.021019935607910156, 0.023183822631835938, 0.02534770965576172, 0.0275115966796875, 0.02967548370361328, 0.03183937072753906, 0.034003257751464844, 0.036167144775390625, 0.038331031799316406, 0.04049491882324219, 0.04265880584716797, 0.04482269287109375, 0.04698657989501953, 0.04915046691894531, 0.051314353942871094, 0.053478240966796875, 0.055642127990722656, 0.05780601501464844, 0.05996990203857422, 0.0621337890625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 16.0, 54.0, 124.0, 326.0, 280.0, 146.0, 48.0, 11.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.771463394165039, -15.40365982055664, -15.035855293273926, -14.668051719665527, -14.300247192382812, -13.932443618774414, -13.564640045166016, -13.1968355178833, -12.829030990600586, -12.461227416992188, -12.093422889709473, -11.725619316101074, -11.35781478881836, -10.990011215209961, -10.622207641601562, -10.254403114318848, -9.88659954071045, -9.51879596710205, -9.150991439819336, -8.783187866210938, -8.415383338928223, -8.047579765319824, -7.679775714874268, -7.311971664428711, -6.944167613983154, -6.576363563537598, -6.208559513092041, -5.840755462646484, -5.472951889038086, -5.105147361755371, -4.737343788146973, -4.369539737701416, -4.001734733581543, -3.6339306831359863, -3.2661266326904297, -2.898322820663452, -2.5305187702178955, -2.162714719772339, -1.7949109077453613, -1.4271068572998047, -1.059302806854248, -0.6914988160133362, -0.3236948251724243, 0.04410910606384277, 0.4119131565093994, 0.779717206954956, 1.1475210189819336, 1.5153250694274902, 1.8831291198730469, 2.2509331703186035, 2.61873722076416, 2.9865410327911377, 3.3543450832366943, 3.722149133682251, 4.0899529457092285, 4.457756996154785, 4.825561046600342, 5.193365097045898, 5.561169147491455, 5.928973197937012, 6.29677677154541, 6.664581298828125, 7.032384872436523, 7.40018892288208, 7.767992973327637]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 8.0, 9.0, 11.0, 19.0, 24.0, 33.0, 27.0, 26.0, 45.0, 29.0, 55.0, 42.0, 42.0, 56.0, 61.0, 51.0, 42.0, 46.0, 50.0, 50.0, 41.0, 28.0, 57.0, 30.0, 23.0, 24.0, 15.0, 17.0, 9.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2903947830200195, -3.199469566345215, -3.1085445880889893, -3.0176193714141846, -2.92669415473938, -2.8357691764831543, -2.7448439598083496, -2.653918743133545, -2.5629937648773193, -2.4720685482025146, -2.381143569946289, -2.2902183532714844, -2.1992931365966797, -2.108368158340454, -2.0174429416656494, -1.9265178442001343, -1.8355926275253296, -1.7446675300598145, -1.6537423133850098, -1.5628172159194946, -1.4718921184539795, -1.3809669017791748, -1.2900418043136597, -1.1991167068481445, -1.1081914901733398, -1.0172663927078247, -0.9263412356376648, -0.8354160785675049, -0.7444909811019897, -0.6535658240318298, -0.5626406669616699, -0.4717155694961548, -0.38079047203063965, -0.2898653447628021, -0.1989402025938034, -0.10801506042480469, -0.017089933156967163, 0.07383519411087036, 0.16476035118103027, 0.2556854486465454, 0.3466106057167053, 0.43753573298454285, 0.5284608602523804, 0.6193860173225403, 0.7103111743927002, 0.8012362718582153, 0.8921614289283752, 0.9830865263938904, 1.0740116834640503, 1.1649367809295654, 1.2558619976043701, 1.3467870950698853, 1.4377121925354004, 1.528637409210205, 1.6195625066757202, 1.7104876041412354, 1.80141282081604, 1.8923379182815552, 1.9832631349563599, 2.074188232421875, 2.1651134490966797, 2.2560384273529053, 2.34696364402771, 2.4378886222839355, 2.5288138389587402]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 18.0, 26.0, 31.0, 41.0, 59.0, 83.0, 136.0, 200.0, 284.0, 496.0, 869.0, 1626.0, 3197.0, 7241.0, 19381.0, 61379.0, 216335.0, 447963.0, 200713.0, 56645.0, 18155.0, 6884.0, 3034.0, 1521.0, 791.0, 500.0, 315.0, 174.0, 135.0, 68.0, 62.0, 50.0, 25.0, 31.0, 12.0, 18.0, 12.0, 6.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.742034912109375, -2.65203857421875, -2.562042236328125, -2.4720458984375, -2.382049560546875, -2.29205322265625, -2.202056884765625, -2.112060546875, -2.022064208984375, -1.93206787109375, -1.842071533203125, -1.7520751953125, -1.662078857421875, -1.57208251953125, -1.482086181640625, -1.39208984375, -1.302093505859375, -1.21209716796875, -1.122100830078125, -1.0321044921875, -0.942108154296875, -0.85211181640625, -0.762115478515625, -0.672119140625, -0.582122802734375, -0.49212646484375, -0.402130126953125, -0.3121337890625, -0.222137451171875, -0.13214111328125, -0.042144775390625, 0.0478515625, 0.137847900390625, 0.22784423828125, 0.317840576171875, 0.4078369140625, 0.497833251953125, 0.58782958984375, 0.677825927734375, 0.767822265625, 0.857818603515625, 0.94781494140625, 1.037811279296875, 1.1278076171875, 1.217803955078125, 1.30780029296875, 1.397796630859375, 1.48779296875, 1.577789306640625, 1.66778564453125, 1.757781982421875, 1.8477783203125, 1.937774658203125, 2.02777099609375, 2.117767333984375, 2.207763671875, 2.297760009765625, 2.38775634765625, 2.477752685546875, 2.5677490234375, 2.657745361328125, 2.74774169921875, 2.837738037109375, 2.927734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 18.0, 8.0, 16.0, 26.0, 19.0, 28.0, 21.0, 26.0, 21.0, 43.0, 34.0, 34.0, 43.0, 39.0, 33.0, 42.0, 38.0, 46.0, 55.0, 39.0, 35.0, 37.0, 26.0, 28.0, 33.0, 19.0, 30.0, 18.0, 24.0, 17.0, 14.0, 16.0, 13.0, 6.0, 10.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.21875, -4.097930908203125, -3.97711181640625, -3.856292724609375, -3.7354736328125, -3.614654541015625, -3.49383544921875, -3.373016357421875, -3.252197265625, -3.131378173828125, -3.01055908203125, -2.889739990234375, -2.7689208984375, -2.648101806640625, -2.52728271484375, -2.406463623046875, -2.28564453125, -2.164825439453125, -2.04400634765625, -1.923187255859375, -1.8023681640625, -1.681549072265625, -1.56072998046875, -1.439910888671875, -1.319091796875, -1.198272705078125, -1.07745361328125, -0.956634521484375, -0.8358154296875, -0.714996337890625, -0.59417724609375, -0.473358154296875, -0.3525390625, -0.231719970703125, -0.11090087890625, 0.009918212890625, 0.1307373046875, 0.251556396484375, 0.37237548828125, 0.493194580078125, 0.614013671875, 0.734832763671875, 0.85565185546875, 0.976470947265625, 1.0972900390625, 1.218109130859375, 1.33892822265625, 1.459747314453125, 1.58056640625, 1.701385498046875, 1.82220458984375, 1.943023681640625, 2.0638427734375, 2.184661865234375, 2.30548095703125, 2.426300048828125, 2.547119140625, 2.667938232421875, 2.78875732421875, 2.909576416015625, 3.0303955078125, 3.151214599609375, 3.27203369140625, 3.392852783203125, 3.513671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 6.0, 9.0, 6.0, 15.0, 18.0, 20.0, 31.0, 33.0, 51.0, 75.0, 112.0, 159.0, 232.0, 793.0, 42468.0, 997982.0, 5408.0, 444.0, 212.0, 135.0, 86.0, 72.0, 49.0, 37.0, 22.0, 24.0, 13.0, 7.0, 4.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.875, -20.28369140625, -19.6923828125, -19.10107421875, -18.509765625, -17.91845703125, -17.3271484375, -16.73583984375, -16.14453125, -15.55322265625, -14.9619140625, -14.37060546875, -13.779296875, -13.18798828125, -12.5966796875, -12.00537109375, -11.4140625, -10.82275390625, -10.2314453125, -9.64013671875, -9.048828125, -8.45751953125, -7.8662109375, -7.27490234375, -6.68359375, -6.09228515625, -5.5009765625, -4.90966796875, -4.318359375, -3.72705078125, -3.1357421875, -2.54443359375, -1.953125, -1.36181640625, -0.7705078125, -0.17919921875, 0.412109375, 1.00341796875, 1.5947265625, 2.18603515625, 2.77734375, 3.36865234375, 3.9599609375, 4.55126953125, 5.142578125, 5.73388671875, 6.3251953125, 6.91650390625, 7.5078125, 8.09912109375, 8.6904296875, 9.28173828125, 9.873046875, 10.46435546875, 11.0556640625, 11.64697265625, 12.23828125, 12.82958984375, 13.4208984375, 14.01220703125, 14.603515625, 15.19482421875, 15.7861328125, 16.37744140625, 16.96875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 12.0, 7.0, 10.0, 11.0, 19.0, 35.0, 35.0, 45.0, 57.0, 60.0, 51.0, 43.0, 60.0, 71.0, 67.0, 62.0, 62.0, 51.0, 39.0, 29.0, 37.0, 32.0, 26.0, 15.0, 12.0, 16.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.96484375, -7.759033203125, -7.55322265625, -7.347412109375, -7.1416015625, -6.935791015625, -6.72998046875, -6.524169921875, -6.318359375, -6.112548828125, -5.90673828125, -5.700927734375, -5.4951171875, -5.289306640625, -5.08349609375, -4.877685546875, -4.671875, -4.466064453125, -4.26025390625, -4.054443359375, -3.8486328125, -3.642822265625, -3.43701171875, -3.231201171875, -3.025390625, -2.819580078125, -2.61376953125, -2.407958984375, -2.2021484375, -1.996337890625, -1.79052734375, -1.584716796875, -1.37890625, -1.173095703125, -0.96728515625, -0.761474609375, -0.5556640625, -0.349853515625, -0.14404296875, 0.061767578125, 0.267578125, 0.473388671875, 0.67919921875, 0.885009765625, 1.0908203125, 1.296630859375, 1.50244140625, 1.708251953125, 1.9140625, 2.119873046875, 2.32568359375, 2.531494140625, 2.7373046875, 2.943115234375, 3.14892578125, 3.354736328125, 3.560546875, 3.766357421875, 3.97216796875, 4.177978515625, 4.3837890625, 4.589599609375, 4.79541015625, 5.001220703125, 5.20703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 11.0, 12.0, 18.0, 36.0, 51.0, 133.0, 564.0, 9372.0, 1022612.0, 14689.0, 728.0, 145.0, 63.0, 43.0, 23.0, 15.0, 10.0, 10.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.60137939453125, -5.3980712890625, -5.19476318359375, -4.991455078125, -4.78814697265625, -4.5848388671875, -4.38153076171875, -4.17822265625, -3.97491455078125, -3.7716064453125, -3.56829833984375, -3.364990234375, -3.16168212890625, -2.9583740234375, -2.75506591796875, -2.5517578125, -2.34844970703125, -2.1451416015625, -1.94183349609375, -1.738525390625, -1.53521728515625, -1.3319091796875, -1.12860107421875, -0.92529296875, -0.72198486328125, -0.5186767578125, -0.31536865234375, -0.112060546875, 0.09124755859375, 0.2945556640625, 0.49786376953125, 0.701171875, 0.90447998046875, 1.1077880859375, 1.31109619140625, 1.514404296875, 1.71771240234375, 1.9210205078125, 2.12432861328125, 2.32763671875, 2.53094482421875, 2.7342529296875, 2.93756103515625, 3.140869140625, 3.34417724609375, 3.5474853515625, 3.75079345703125, 3.9541015625, 4.15740966796875, 4.3607177734375, 4.56402587890625, 4.767333984375, 4.97064208984375, 5.1739501953125, 5.37725830078125, 5.58056640625, 5.78387451171875, 5.9871826171875, 6.19049072265625, 6.393798828125, 6.59710693359375, 6.8004150390625, 7.00372314453125, 7.20703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 15.0, 16.0, 22.0, 33.0, 52.0, 89.0, 124.0, 160.0, 136.0, 123.0, 83.0, 39.0, 29.0, 25.0, 17.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023257732391357422, -0.00022476725280284882, -0.0002169571816921234, -0.000209147110581398, -0.0002013370394706726, -0.0001935269683599472, -0.0001857168972492218, -0.0001779068261384964, -0.000170096755027771, -0.0001622866839170456, -0.0001544766128063202, -0.0001466665416955948, -0.00013885647058486938, -0.00013104639947414398, -0.00012323632836341858, -0.00011542625725269318, -0.00010761618614196777, -9.980611503124237e-05, -9.199604392051697e-05, -8.418597280979156e-05, -7.637590169906616e-05, -6.856583058834076e-05, -6.0755759477615356e-05, -5.2945688366889954e-05, -4.513561725616455e-05, -3.732554614543915e-05, -2.9515475034713745e-05, -2.1705403923988342e-05, -1.389533281326294e-05, -6.085261702537537e-06, 1.7248094081878662e-06, 9.534880518913269e-06, 1.7344951629638672e-05, 2.5155022740364075e-05, 3.296509385108948e-05, 4.077516496181488e-05, 4.858523607254028e-05, 5.6395307183265686e-05, 6.420537829399109e-05, 7.201544940471649e-05, 7.98255205154419e-05, 8.76355916261673e-05, 9.54456627368927e-05, 0.0001032557338476181, 0.0001110658049583435, 0.00011887587606906891, 0.0001266859471797943, 0.00013449601829051971, 0.00014230608940124512, 0.00015011616051197052, 0.00015792623162269592, 0.00016573630273342133, 0.00017354637384414673, 0.00018135644495487213, 0.00018916651606559753, 0.00019697658717632294, 0.00020478665828704834, 0.00021259672939777374, 0.00022040680050849915, 0.00022821687161922455, 0.00023602694272994995, 0.00024383701384067535, 0.00025164708495140076, 0.00025945715606212616, 0.00026726722717285156]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 9.0, 4.0, 2.0, 8.0, 15.0, 19.0, 18.0, 25.0, 53.0, 83.0, 125.0, 450.0, 5078.0, 823433.0, 216085.0, 2491.0, 356.0, 108.0, 69.0, 35.0, 29.0, 14.0, 15.0, 6.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.0234375, -5.860107421875, -5.69677734375, -5.533447265625, -5.3701171875, -5.206787109375, -5.04345703125, -4.880126953125, -4.716796875, -4.553466796875, -4.39013671875, -4.226806640625, -4.0634765625, -3.900146484375, -3.73681640625, -3.573486328125, -3.41015625, -3.246826171875, -3.08349609375, -2.920166015625, -2.7568359375, -2.593505859375, -2.43017578125, -2.266845703125, -2.103515625, -1.940185546875, -1.77685546875, -1.613525390625, -1.4501953125, -1.286865234375, -1.12353515625, -0.960205078125, -0.796875, -0.633544921875, -0.47021484375, -0.306884765625, -0.1435546875, 0.019775390625, 0.18310546875, 0.346435546875, 0.509765625, 0.673095703125, 0.83642578125, 0.999755859375, 1.1630859375, 1.326416015625, 1.48974609375, 1.653076171875, 1.81640625, 1.979736328125, 2.14306640625, 2.306396484375, 2.4697265625, 2.633056640625, 2.79638671875, 2.959716796875, 3.123046875, 3.286376953125, 3.44970703125, 3.613037109375, 3.7763671875, 3.939697265625, 4.10302734375, 4.266357421875, 4.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 5.0, 7.0, 10.0, 11.0, 15.0, 27.0, 29.0, 39.0, 62.0, 76.0, 90.0, 108.0, 96.0, 97.0, 85.0, 48.0, 44.0, 25.0, 21.0, 21.0, 12.0, 12.0, 9.0, 13.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5020980834960938, -0.4841766357421875, -0.46625518798828125, -0.448333740234375, -0.43041229248046875, -0.4124908447265625, -0.39456939697265625, -0.37664794921875, -0.35872650146484375, -0.3408050537109375, -0.32288360595703125, -0.304962158203125, -0.28704071044921875, -0.2691192626953125, -0.25119781494140625, -0.2332763671875, -0.21535491943359375, -0.1974334716796875, -0.17951202392578125, -0.161590576171875, -0.14366912841796875, -0.1257476806640625, -0.10782623291015625, -0.08990478515625, -0.07198333740234375, -0.0540618896484375, -0.03614044189453125, -0.018218994140625, -0.00029754638671875, 0.0176239013671875, 0.03554534912109375, 0.053466796875, 0.07138824462890625, 0.0893096923828125, 0.10723114013671875, 0.125152587890625, 0.14307403564453125, 0.1609954833984375, 0.17891693115234375, 0.19683837890625, 0.21475982666015625, 0.2326812744140625, 0.25060272216796875, 0.268524169921875, 0.28644561767578125, 0.3043670654296875, 0.32228851318359375, 0.3402099609375, 0.35813140869140625, 0.3760528564453125, 0.39397430419921875, 0.411895751953125, 0.42981719970703125, 0.4477386474609375, 0.46566009521484375, 0.48358154296875, 0.5015029907226562, 0.5194244384765625, 0.5373458862304688, 0.555267333984375, 0.5731887817382812, 0.5911102294921875, 0.6090316772460938, 0.626953125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 15.0, 168.0, 620.0, 193.0, 16.0, 0.0, 1.0, 1.0], "bins": [-85.31723022460938, -83.857666015625, -82.3980941772461, -80.93852996826172, -79.47895812988281, -78.01939392089844, -76.55982971191406, -75.10025787353516, -73.64069366455078, -72.1811294555664, -70.7215576171875, -69.26199340820312, -67.80242156982422, -66.34285736083984, -64.88328552246094, -63.42372131347656, -61.96415328979492, -60.50458526611328, -59.04501724243164, -57.58544921875, -56.125885009765625, -54.666316986083984, -53.206748962402344, -51.7471809387207, -50.28761291503906, -48.82804489135742, -47.36847686767578, -45.908912658691406, -44.449344635009766, -42.989776611328125, -41.530208587646484, -40.070640563964844, -38.61107635498047, -37.15150833129883, -35.69194030761719, -34.23237609863281, -32.77280807495117, -31.31324005126953, -29.85367202758789, -28.39410400390625, -26.93453598022461, -25.47496795654297, -24.01540184020996, -22.55583381652832, -21.096267700195312, -19.636699676513672, -18.17713165283203, -16.71756362915039, -15.2579984664917, -13.798431396484375, -12.338863372802734, -10.87929630279541, -9.419729232788086, -7.960162162780762, -6.500594139099121, -5.041027069091797, -3.5814599990844727, -2.1218926906585693, -0.662325382232666, 0.7972421646118164, 2.2568092346191406, 3.716376304626465, 5.1759443283081055, 6.63551139831543, 8.095078468322754]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 12.0, 17.0, 15.0, 25.0, 35.0, 33.0, 36.0, 50.0, 46.0, 42.0, 57.0, 55.0, 54.0, 60.0, 64.0, 45.0, 52.0, 52.0, 39.0, 36.0, 32.0, 34.0, 24.0, 29.0, 21.0, 13.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.296927452087402, -12.023918151855469, -11.750909805297852, -11.477900505065918, -11.2048921585083, -10.931882858276367, -10.65887451171875, -10.385865211486816, -10.112855911254883, -9.83984661102295, -9.566838264465332, -9.293828964233398, -9.020820617675781, -8.747811317443848, -8.474802017211914, -8.201793670654297, -7.9287848472595215, -7.655776023864746, -7.382767200469971, -7.109758377075195, -6.836749076843262, -6.563740253448486, -6.290731430053711, -6.0177226066589355, -5.74471378326416, -5.471704959869385, -5.198696136474609, -4.925686836242676, -4.6526780128479, -4.379669189453125, -4.10666036605835, -3.833651542663574, -3.5606422424316406, -3.2876334190368652, -3.0146243572235107, -2.7416155338287354, -2.468606472015381, -2.1955976486206055, -1.92258882522583, -1.6495798826217651, -1.3765709400177002, -1.1035619974136353, -0.8305531144142151, -0.5575442314147949, -0.28453528881073, -0.011526346206665039, 0.26148247718811035, 0.5344914197921753, 0.8075003623962402, 1.0805093050003052, 1.3535182476043701, 1.6265270709991455, 1.8995360136032104, 2.1725449562072754, 2.445553779602051, 2.718562602996826, 2.9915716648101807, 3.264580488204956, 3.5375895500183105, 3.810598373413086, 4.083607196807861, 4.356616020202637, 4.62962532043457, 4.902634143829346, 5.175642967224121]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 9.0, 11.0, 14.0, 15.0, 18.0, 31.0, 46.0, 52.0, 68.0, 109.0, 158.0, 224.0, 459.0, 1030.0, 3160.0, 14816.0, 116820.0, 1104153.0, 2380266.0, 508989.0, 51117.0, 8597.0, 2405.0, 840.0, 303.0, 178.0, 107.0, 78.0, 38.0, 47.0, 30.0, 18.0, 11.0, 9.0, 8.0, 13.0, 11.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.33203125, -4.17340087890625, -4.0147705078125, -3.85614013671875, -3.697509765625, -3.53887939453125, -3.3802490234375, -3.22161865234375, -3.06298828125, -2.90435791015625, -2.7457275390625, -2.58709716796875, -2.428466796875, -2.26983642578125, -2.1112060546875, -1.95257568359375, -1.7939453125, -1.63531494140625, -1.4766845703125, -1.31805419921875, -1.159423828125, -1.00079345703125, -0.8421630859375, -0.68353271484375, -0.52490234375, -0.36627197265625, -0.2076416015625, -0.04901123046875, 0.109619140625, 0.26824951171875, 0.4268798828125, 0.58551025390625, 0.744140625, 0.90277099609375, 1.0614013671875, 1.22003173828125, 1.378662109375, 1.53729248046875, 1.6959228515625, 1.85455322265625, 2.01318359375, 2.17181396484375, 2.3304443359375, 2.48907470703125, 2.647705078125, 2.80633544921875, 2.9649658203125, 3.12359619140625, 3.2822265625, 3.44085693359375, 3.5994873046875, 3.75811767578125, 3.916748046875, 4.07537841796875, 4.2340087890625, 4.39263916015625, 4.55126953125, 4.70989990234375, 4.8685302734375, 5.02716064453125, 5.185791015625, 5.34442138671875, 5.5030517578125, 5.66168212890625, 5.8203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 7.0, 11.0, 9.0, 26.0, 25.0, 36.0, 46.0, 47.0, 53.0, 55.0, 46.0, 53.0, 51.0, 89.0, 67.0, 62.0, 57.0, 54.0, 42.0, 32.0, 22.0, 36.0, 21.0, 19.0, 13.0, 7.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0], "bins": [-5.578125, -5.454620361328125, -5.33111572265625, -5.207611083984375, -5.0841064453125, -4.960601806640625, -4.83709716796875, -4.713592529296875, -4.590087890625, -4.466583251953125, -4.34307861328125, -4.219573974609375, -4.0960693359375, -3.972564697265625, -3.84906005859375, -3.725555419921875, -3.60205078125, -3.478546142578125, -3.35504150390625, -3.231536865234375, -3.1080322265625, -2.984527587890625, -2.86102294921875, -2.737518310546875, -2.614013671875, -2.490509033203125, -2.36700439453125, -2.243499755859375, -2.1199951171875, -1.996490478515625, -1.87298583984375, -1.749481201171875, -1.6259765625, -1.502471923828125, -1.37896728515625, -1.255462646484375, -1.1319580078125, -1.008453369140625, -0.88494873046875, -0.761444091796875, -0.637939453125, -0.514434814453125, -0.39093017578125, -0.267425537109375, -0.1439208984375, -0.020416259765625, 0.10308837890625, 0.226593017578125, 0.35009765625, 0.473602294921875, 0.59710693359375, 0.720611572265625, 0.8441162109375, 0.967620849609375, 1.09112548828125, 1.214630126953125, 1.338134765625, 1.461639404296875, 1.58514404296875, 1.708648681640625, 1.8321533203125, 1.955657958984375, 2.07916259765625, 2.202667236328125, 2.326171875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 14.0, 15.0, 26.0, 60.0, 127.0, 371.0, 1872.0, 334143.0, 3851824.0, 4903.0, 562.0, 194.0, 71.0, 32.0, 24.0, 10.0, 5.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.4794921875, -15.849609375, -15.2197265625, -14.58984375, -13.9599609375, -13.330078125, -12.7001953125, -12.0703125, -11.4404296875, -10.810546875, -10.1806640625, -9.55078125, -8.9208984375, -8.291015625, -7.6611328125, -7.03125, -6.4013671875, -5.771484375, -5.1416015625, -4.51171875, -3.8818359375, -3.251953125, -2.6220703125, -1.9921875, -1.3623046875, -0.732421875, -0.1025390625, 0.52734375, 1.1572265625, 1.787109375, 2.4169921875, 3.046875, 3.6767578125, 4.306640625, 4.9365234375, 5.56640625, 6.1962890625, 6.826171875, 7.4560546875, 8.0859375, 8.7158203125, 9.345703125, 9.9755859375, 10.60546875, 11.2353515625, 11.865234375, 12.4951171875, 13.125, 13.7548828125, 14.384765625, 15.0146484375, 15.64453125, 16.2744140625, 16.904296875, 17.5341796875, 18.1640625, 18.7939453125, 19.423828125, 20.0537109375, 20.68359375, 21.3134765625, 21.943359375, 22.5732421875, 23.203125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 4.0, 14.0, 14.0, 25.0, 32.0, 63.0, 85.0, 134.0, 216.0, 317.0, 529.0, 643.0, 676.0, 485.0, 303.0, 192.0, 109.0, 78.0, 48.0, 39.0, 19.0, 16.0, 13.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.87109375, -1.814117431640625, -1.75714111328125, -1.700164794921875, -1.6431884765625, -1.586212158203125, -1.52923583984375, -1.472259521484375, -1.415283203125, -1.358306884765625, -1.30133056640625, -1.244354248046875, -1.1873779296875, -1.130401611328125, -1.07342529296875, -1.016448974609375, -0.95947265625, -0.902496337890625, -0.84552001953125, -0.788543701171875, -0.7315673828125, -0.674591064453125, -0.61761474609375, -0.560638427734375, -0.503662109375, -0.446685791015625, -0.38970947265625, -0.332733154296875, -0.2757568359375, -0.218780517578125, -0.16180419921875, -0.104827880859375, -0.0478515625, 0.009124755859375, 0.06610107421875, 0.123077392578125, 0.1800537109375, 0.237030029296875, 0.29400634765625, 0.350982666015625, 0.407958984375, 0.464935302734375, 0.52191162109375, 0.578887939453125, 0.6358642578125, 0.692840576171875, 0.74981689453125, 0.806793212890625, 0.86376953125, 0.920745849609375, 0.97772216796875, 1.034698486328125, 1.0916748046875, 1.148651123046875, 1.20562744140625, 1.262603759765625, 1.319580078125, 1.376556396484375, 1.43353271484375, 1.490509033203125, 1.5474853515625, 1.604461669921875, 1.66143798828125, 1.718414306640625, 1.775390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 13.0, 36.0, 64.0, 100.0, 202.0, 204.0, 174.0, 108.0, 62.0, 31.0, 6.0, 3.0, 2.0], "bins": [-20.78423500061035, -20.415246963500977, -20.04625701904297, -19.677268981933594, -19.30828094482422, -18.939292907714844, -18.570302963256836, -18.20131492614746, -17.832326889038086, -17.46333885192871, -17.094348907470703, -16.725360870361328, -16.356372833251953, -15.987383842468262, -15.61839485168457, -15.249406814575195, -14.880417823791504, -14.511428833007812, -14.142440795898438, -13.773451805114746, -13.404463768005371, -13.03547477722168, -12.666486740112305, -12.297497749328613, -11.928508758544922, -11.55951976776123, -11.190531730651855, -10.821542739868164, -10.452554702758789, -10.083565711975098, -9.714576721191406, -9.345588684082031, -8.976601600646973, -8.607612609863281, -8.238624572753906, -7.869635581970215, -7.50064754486084, -7.131658554077148, -6.762670040130615, -6.393681526184082, -6.024693012237549, -5.655704498291016, -5.286715984344482, -4.917727470397949, -4.548738479614258, -4.179750442504883, -3.8107614517211914, -3.441772937774658, -3.072784423828125, -2.703795909881592, -2.3348073959350586, -1.9658186435699463, -1.596830129623413, -1.2278416156768799, -0.8588528633117676, -0.4898643493652344, -0.12087583541870117, 0.2481127381324768, 0.6171013116836548, 0.9860899448394775, 1.3550784587860107, 1.724066972732544, 2.0930557250976562, 2.4620442390441895, 2.8310327529907227]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 11.0, 22.0, 20.0, 26.0, 26.0, 39.0, 24.0, 38.0, 50.0, 43.0, 54.0, 62.0, 70.0, 49.0, 59.0, 58.0, 64.0, 48.0, 33.0, 28.0, 39.0, 16.0, 30.0, 22.0, 15.0, 12.0, 10.0, 4.0, 0.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.130297660827637, -3.998098850250244, -3.8659000396728516, -3.733701229095459, -3.6015024185180664, -3.469303607940674, -3.3371047973632812, -3.2049059867858887, -3.072707176208496, -2.9405083656311035, -2.808309555053711, -2.6761107444763184, -2.543911933898926, -2.411713123321533, -2.2795143127441406, -2.147315502166748, -2.0151166915893555, -1.882917881011963, -1.7507190704345703, -1.6185202598571777, -1.4863214492797852, -1.3541226387023926, -1.221923828125, -1.0897250175476074, -0.9575262069702148, -0.8253273963928223, -0.6931285858154297, -0.5609297752380371, -0.42873096466064453, -0.29653215408325195, -0.16433334350585938, -0.0321345329284668, 0.10006427764892578, 0.23226308822631836, 0.36446189880371094, 0.4966607093811035, 0.6288595199584961, 0.7610583305358887, 0.8932571411132812, 1.0254559516906738, 1.1576547622680664, 1.289853572845459, 1.4220523834228516, 1.5542511940002441, 1.6864500045776367, 1.8186488151550293, 1.9508476257324219, 2.0830464363098145, 2.215245246887207, 2.3474440574645996, 2.479642868041992, 2.6118416786193848, 2.7440404891967773, 2.87623929977417, 3.0084381103515625, 3.140636920928955, 3.2728357315063477, 3.4050345420837402, 3.537233352661133, 3.6694321632385254, 3.801630973815918, 3.9338297843933105, 4.066028594970703, 4.198227405548096, 4.330426216125488]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 12.0, 11.0, 21.0, 38.0, 50.0, 82.0, 131.0, 218.0, 440.0, 784.0, 1471.0, 3361.0, 9095.0, 42916.0, 325214.0, 551282.0, 89545.0, 15099.0, 4552.0, 1968.0, 985.0, 519.0, 298.0, 149.0, 107.0, 61.0, 48.0, 28.0, 18.0, 9.0, 5.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9404296875, -0.9030914306640625, -0.865753173828125, -0.8284149169921875, -0.79107666015625, -0.7537384033203125, -0.716400146484375, -0.6790618896484375, -0.6417236328125, -0.6043853759765625, -0.567047119140625, -0.5297088623046875, -0.49237060546875, -0.4550323486328125, -0.417694091796875, -0.3803558349609375, -0.343017578125, -0.3056793212890625, -0.268341064453125, -0.2310028076171875, -0.19366455078125, -0.1563262939453125, -0.118988037109375, -0.0816497802734375, -0.0443115234375, -0.0069732666015625, 0.030364990234375, 0.0677032470703125, 0.10504150390625, 0.1423797607421875, 0.179718017578125, 0.2170562744140625, 0.25439453125, 0.2917327880859375, 0.329071044921875, 0.3664093017578125, 0.40374755859375, 0.4410858154296875, 0.478424072265625, 0.5157623291015625, 0.5531005859375, 0.5904388427734375, 0.627777099609375, 0.6651153564453125, 0.70245361328125, 0.7397918701171875, 0.777130126953125, 0.8144683837890625, 0.851806640625, 0.8891448974609375, 0.926483154296875, 0.9638214111328125, 1.00115966796875, 1.0384979248046875, 1.075836181640625, 1.1131744384765625, 1.1505126953125, 1.1878509521484375, 1.225189208984375, 1.2625274658203125, 1.29986572265625, 1.3372039794921875, 1.374542236328125, 1.4118804931640625, 1.44921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 13.0, 14.0, 19.0, 24.0, 15.0, 34.0, 28.0, 31.0, 47.0, 48.0, 46.0, 63.0, 65.0, 66.0, 80.0, 56.0, 63.0, 55.0, 44.0, 36.0, 38.0, 20.0, 32.0, 24.0, 15.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.556640625, -3.466522216796875, -3.37640380859375, -3.286285400390625, -3.1961669921875, -3.106048583984375, -3.01593017578125, -2.925811767578125, -2.835693359375, -2.745574951171875, -2.65545654296875, -2.565338134765625, -2.4752197265625, -2.385101318359375, -2.29498291015625, -2.204864501953125, -2.11474609375, -2.024627685546875, -1.93450927734375, -1.844390869140625, -1.7542724609375, -1.664154052734375, -1.57403564453125, -1.483917236328125, -1.393798828125, -1.303680419921875, -1.21356201171875, -1.123443603515625, -1.0333251953125, -0.943206787109375, -0.85308837890625, -0.762969970703125, -0.6728515625, -0.582733154296875, -0.49261474609375, -0.402496337890625, -0.3123779296875, -0.222259521484375, -0.13214111328125, -0.042022705078125, 0.048095703125, 0.138214111328125, 0.22833251953125, 0.318450927734375, 0.4085693359375, 0.498687744140625, 0.58880615234375, 0.678924560546875, 0.76904296875, 0.859161376953125, 0.94927978515625, 1.039398193359375, 1.1295166015625, 1.219635009765625, 1.30975341796875, 1.399871826171875, 1.489990234375, 1.580108642578125, 1.67022705078125, 1.760345458984375, 1.8504638671875, 1.940582275390625, 2.03070068359375, 2.120819091796875, 2.2109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 11.0, 11.0, 27.0, 17.0, 46.0, 56.0, 81.0, 120.0, 162.0, 238.0, 356.0, 569.0, 826.0, 1421.0, 2224.0, 3783.0, 6582.0, 11952.0, 21316.0, 39950.0, 73557.0, 128638.0, 192301.0, 206584.0, 153791.0, 91582.0, 49808.0, 27328.0, 14734.0, 8248.0, 4775.0, 2735.0, 1671.0, 1017.0, 630.0, 467.0, 296.0, 197.0, 125.0, 83.0, 64.0, 47.0, 38.0, 21.0, 22.0, 11.0, 10.0, 10.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2496337890625, -0.24162864685058594, -0.23362350463867188, -0.2256183624267578, -0.21761322021484375, -0.2096080780029297, -0.20160293579101562, -0.19359779357910156, -0.1855926513671875, -0.17758750915527344, -0.16958236694335938, -0.1615772247314453, -0.15357208251953125, -0.1455669403076172, -0.13756179809570312, -0.12955665588378906, -0.121551513671875, -0.11354637145996094, -0.10554122924804688, -0.09753608703613281, -0.08953094482421875, -0.08152580261230469, -0.07352066040039062, -0.06551551818847656, -0.0575103759765625, -0.04950523376464844, -0.041500091552734375, -0.03349494934082031, -0.02548980712890625, -0.017484664916992188, -0.009479522705078125, -0.0014743804931640625, 0.00653076171875, 0.014535903930664062, 0.022541046142578125, 0.030546188354492188, 0.03855133056640625, 0.04655647277832031, 0.054561614990234375, 0.06256675720214844, 0.0705718994140625, 0.07857704162597656, 0.08658218383789062, 0.09458732604980469, 0.10259246826171875, 0.11059761047363281, 0.11860275268554688, 0.12660789489746094, 0.134613037109375, 0.14261817932128906, 0.15062332153320312, 0.1586284637451172, 0.16663360595703125, 0.1746387481689453, 0.18264389038085938, 0.19064903259277344, 0.1986541748046875, 0.20665931701660156, 0.21466445922851562, 0.2226696014404297, 0.23067474365234375, 0.2386798858642578, 0.24668502807617188, 0.25469017028808594, 0.2626953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 7.0, 11.0, 7.0, 12.0, 18.0, 18.0, 14.0, 13.0, 25.0, 30.0, 41.0, 51.0, 48.0, 60.0, 48.0, 50.0, 60.0, 59.0, 52.0, 57.0, 37.0, 44.0, 41.0, 36.0, 25.0, 23.0, 33.0, 18.0, 15.0, 8.0, 6.0, 9.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.6015625, -4.460205078125, -4.31884765625, -4.177490234375, -4.0361328125, -3.894775390625, -3.75341796875, -3.612060546875, -3.470703125, -3.329345703125, -3.18798828125, -3.046630859375, -2.9052734375, -2.763916015625, -2.62255859375, -2.481201171875, -2.33984375, -2.198486328125, -2.05712890625, -1.915771484375, -1.7744140625, -1.633056640625, -1.49169921875, -1.350341796875, -1.208984375, -1.067626953125, -0.92626953125, -0.784912109375, -0.6435546875, -0.502197265625, -0.36083984375, -0.219482421875, -0.078125, 0.063232421875, 0.20458984375, 0.345947265625, 0.4873046875, 0.628662109375, 0.77001953125, 0.911376953125, 1.052734375, 1.194091796875, 1.33544921875, 1.476806640625, 1.6181640625, 1.759521484375, 1.90087890625, 2.042236328125, 2.18359375, 2.324951171875, 2.46630859375, 2.607666015625, 2.7490234375, 2.890380859375, 3.03173828125, 3.173095703125, 3.314453125, 3.455810546875, 3.59716796875, 3.738525390625, 3.8798828125, 4.021240234375, 4.16259765625, 4.303955078125, 4.4453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 13.0, 17.0, 20.0, 36.0, 49.0, 71.0, 112.0, 167.0, 258.0, 412.0, 727.0, 1465.0, 3459.0, 9148.0, 31091.0, 131849.0, 444928.0, 319329.0, 75059.0, 19021.0, 6267.0, 2423.0, 1052.0, 583.0, 344.0, 183.0, 118.0, 100.0, 63.0, 46.0, 30.0, 23.0, 14.0, 16.0, 13.0, 12.0, 6.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0673828125, -0.06519603729248047, -0.06300926208496094, -0.060822486877441406, -0.058635711669921875, -0.056448936462402344, -0.05426216125488281, -0.05207538604736328, -0.04988861083984375, -0.04770183563232422, -0.04551506042480469, -0.043328285217285156, -0.041141510009765625, -0.038954734802246094, -0.03676795959472656, -0.03458118438720703, -0.0323944091796875, -0.03020763397216797, -0.028020858764648438, -0.025834083557128906, -0.023647308349609375, -0.021460533142089844, -0.019273757934570312, -0.01708698272705078, -0.01490020751953125, -0.012713432312011719, -0.010526657104492188, -0.008339881896972656, -0.006153106689453125, -0.003966331481933594, -0.0017795562744140625, 0.00040721893310546875, 0.002593994140625, 0.004780769348144531, 0.0069675445556640625, 0.009154319763183594, 0.011341094970703125, 0.013527870178222656, 0.015714645385742188, 0.01790142059326172, 0.02008819580078125, 0.02227497100830078, 0.024461746215820312, 0.026648521423339844, 0.028835296630859375, 0.031022071838378906, 0.03320884704589844, 0.03539562225341797, 0.0375823974609375, 0.03976917266845703, 0.04195594787597656, 0.044142723083496094, 0.046329498291015625, 0.048516273498535156, 0.05070304870605469, 0.05288982391357422, 0.05507659912109375, 0.05726337432861328, 0.05945014953613281, 0.061636924743652344, 0.06382369995117188, 0.0660104751586914, 0.06819725036621094, 0.07038402557373047, 0.07257080078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 10.0, 15.0, 7.0, 15.0, 16.0, 36.0, 36.0, 42.0, 49.0, 50.0, 75.0, 72.0, 68.0, 65.0, 81.0, 70.0, 63.0, 41.0, 39.0, 32.0, 22.0, 20.0, 14.0, 12.0, 6.0, 8.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.349781036376953e-05, -3.233086317777634e-05, -3.116391599178314e-05, -2.9996968805789948e-05, -2.8830021619796753e-05, -2.766307443380356e-05, -2.6496127247810364e-05, -2.532918006181717e-05, -2.4162232875823975e-05, -2.299528568983078e-05, -2.1828338503837585e-05, -2.066139131784439e-05, -1.9494444131851196e-05, -1.8327496945858002e-05, -1.7160549759864807e-05, -1.5993602573871613e-05, -1.4826655387878418e-05, -1.3659708201885223e-05, -1.2492761015892029e-05, -1.1325813829898834e-05, -1.015886664390564e-05, -8.991919457912445e-06, -7.82497227191925e-06, -6.658025085926056e-06, -5.491077899932861e-06, -4.324130713939667e-06, -3.157183527946472e-06, -1.9902363419532776e-06, -8.23289155960083e-07, 3.4365803003311157e-07, 1.5106052160263062e-06, 2.6775524020195007e-06, 3.844499588012695e-06, 5.01144677400589e-06, 6.1783939599990845e-06, 7.345341145992279e-06, 8.512288331985474e-06, 9.679235517978668e-06, 1.0846182703971863e-05, 1.2013129889965057e-05, 1.3180077075958252e-05, 1.4347024261951447e-05, 1.551397144794464e-05, 1.6680918633937836e-05, 1.784786581993103e-05, 1.9014813005924225e-05, 2.018176019191742e-05, 2.1348707377910614e-05, 2.251565456390381e-05, 2.3682601749897003e-05, 2.4849548935890198e-05, 2.6016496121883392e-05, 2.7183443307876587e-05, 2.835039049386978e-05, 2.9517337679862976e-05, 3.068428486585617e-05, 3.1851232051849365e-05, 3.301817923784256e-05, 3.4185126423835754e-05, 3.535207360982895e-05, 3.6519020795822144e-05, 3.768596798181534e-05, 3.885291516780853e-05, 4.001986235380173e-05, 4.118680953979492e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 2.0, 11.0, 14.0, 15.0, 23.0, 26.0, 33.0, 50.0, 97.0, 178.0, 362.0, 800.0, 2223.0, 7223.0, 29406.0, 206644.0, 641897.0, 129950.0, 20968.0, 5475.0, 1762.0, 685.0, 307.0, 136.0, 74.0, 55.0, 35.0, 23.0, 20.0, 11.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.10406494140625, -0.10074996948242188, -0.09743499755859375, -0.09412002563476562, -0.0908050537109375, -0.08749008178710938, -0.08417510986328125, -0.08086013793945312, -0.077545166015625, -0.07423019409179688, -0.07091522216796875, -0.06760025024414062, -0.0642852783203125, -0.060970306396484375, -0.05765533447265625, -0.054340362548828125, -0.051025390625, -0.047710418701171875, -0.04439544677734375, -0.041080474853515625, -0.0377655029296875, -0.034450531005859375, -0.03113555908203125, -0.027820587158203125, -0.024505615234375, -0.021190643310546875, -0.01787567138671875, -0.014560699462890625, -0.0112457275390625, -0.007930755615234375, -0.00461578369140625, -0.001300811767578125, 0.00201416015625, 0.005329132080078125, 0.00864410400390625, 0.011959075927734375, 0.0152740478515625, 0.018589019775390625, 0.02190399169921875, 0.025218963623046875, 0.028533935546875, 0.031848907470703125, 0.03516387939453125, 0.038478851318359375, 0.0417938232421875, 0.045108795166015625, 0.04842376708984375, 0.051738739013671875, 0.0550537109375, 0.058368682861328125, 0.06168365478515625, 0.06499862670898438, 0.0683135986328125, 0.07162857055664062, 0.07494354248046875, 0.07825851440429688, 0.081573486328125, 0.08488845825195312, 0.08820343017578125, 0.09151840209960938, 0.0948333740234375, 0.09814834594726562, 0.10146331787109375, 0.10477828979492188, 0.10809326171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 8.0, 17.0, 13.0, 16.0, 26.0, 30.0, 43.0, 58.0, 79.0, 123.0, 103.0, 107.0, 102.0, 55.0, 42.0, 38.0, 24.0, 11.0, 14.0, 11.0, 5.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0247039794921875, -0.023903608322143555, -0.02310323715209961, -0.022302865982055664, -0.02150249481201172, -0.020702123641967773, -0.019901752471923828, -0.019101381301879883, -0.018301010131835938, -0.017500638961791992, -0.016700267791748047, -0.0158998966217041, -0.015099525451660156, -0.014299154281616211, -0.013498783111572266, -0.01269841194152832, -0.011898040771484375, -0.01109766960144043, -0.010297298431396484, -0.009496927261352539, -0.008696556091308594, -0.007896184921264648, -0.007095813751220703, -0.006295442581176758, -0.0054950714111328125, -0.004694700241088867, -0.003894329071044922, -0.0030939579010009766, -0.0022935867309570312, -0.001493215560913086, -0.0006928443908691406, 0.00010752677917480469, 0.00090789794921875, 0.0017082691192626953, 0.0025086402893066406, 0.003309011459350586, 0.004109382629394531, 0.0049097537994384766, 0.005710124969482422, 0.006510496139526367, 0.0073108673095703125, 0.008111238479614258, 0.008911609649658203, 0.009711980819702148, 0.010512351989746094, 0.011312723159790039, 0.012113094329833984, 0.01291346549987793, 0.013713836669921875, 0.01451420783996582, 0.015314579010009766, 0.01611495018005371, 0.016915321350097656, 0.0177156925201416, 0.018516063690185547, 0.019316434860229492, 0.020116806030273438, 0.020917177200317383, 0.021717548370361328, 0.022517919540405273, 0.02331829071044922, 0.024118661880493164, 0.02491903305053711, 0.025719404220581055, 0.026519775390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 16.0, 42.0, 75.0, 167.0, 244.0, 219.0, 135.0, 70.0, 22.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.225727081298828, -10.974468231201172, -10.7232084274292, -10.471949577331543, -10.220690727233887, -9.969430923461914, -9.718172073364258, -9.466913223266602, -9.215653419494629, -8.964394569396973, -8.713134765625, -8.461875915527344, -8.210617065429688, -7.959357261657715, -7.708098411560059, -7.456839084625244, -7.205580234527588, -6.954320907592773, -6.703062057495117, -6.451802730560303, -6.200543403625488, -5.949284553527832, -5.698025226593018, -5.446765899658203, -5.195507049560547, -4.944247722625732, -4.692988872528076, -4.441729545593262, -4.190470218658447, -3.939211130142212, -3.6879520416259766, -3.436692714691162, -3.1854333877563477, -2.9341742992401123, -2.682914972305298, -2.4316558837890625, -2.180396556854248, -1.9291374683380127, -1.6778783798217773, -1.4266191720962524, -1.1753599643707275, -0.9241007566452026, -0.6728416085243225, -0.4215824604034424, -0.17032325267791748, 0.08093595504760742, 0.3321950435638428, 0.5834542512893677, 0.8347134590148926, 1.0859726667404175, 1.3372318744659424, 1.5884909629821777, 1.8397501707077026, 2.0910093784332275, 2.342268466949463, 2.5935277938842773, 2.8447868824005127, 3.096045970916748, 3.3473052978515625, 3.598564386367798, 3.849823474884033, 4.101082801818848, 4.352341651916504, 4.603600978851318, 4.854860305786133]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 17.0, 30.0, 33.0, 36.0, 46.0, 45.0, 66.0, 65.0, 96.0, 85.0, 71.0, 94.0, 80.0, 44.0, 42.0, 43.0, 34.0, 27.0, 14.0, 12.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.771545886993408, -3.659273624420166, -3.547001361846924, -3.4347290992736816, -3.3224568367004395, -3.2101845741271973, -3.097912311553955, -2.985640048980713, -2.8733677864074707, -2.7610955238342285, -2.6488232612609863, -2.536550998687744, -2.424278736114502, -2.3120064735412598, -2.1997342109680176, -2.0874619483947754, -1.9751899242401123, -1.8629176616668701, -1.750645399093628, -1.6383731365203857, -1.5261008739471436, -1.4138286113739014, -1.3015564680099487, -1.1892842054367065, -1.0770119428634644, -0.9647396802902222, -0.85246741771698, -0.7401952147483826, -0.6279229521751404, -0.5156506896018982, -0.4033784866333008, -0.2911062240600586, -0.1788339614868164, -0.06656171381473541, 0.04571053385734558, 0.15798276662826538, 0.27025502920150757, 0.38252729177474976, 0.49479949474334717, 0.6070717573165894, 0.7193440198898315, 0.8316162824630737, 0.9438885450363159, 1.0561606884002686, 1.1684329509735107, 1.280705213546753, 1.3929774761199951, 1.5052497386932373, 1.6175220012664795, 1.7297942638397217, 1.8420665264129639, 1.954338788986206, 2.0666110515594482, 2.1788833141326904, 2.2911553382873535, 2.4034276008605957, 2.515699863433838, 2.62797212600708, 2.7402443885803223, 2.8525166511535645, 2.9647889137268066, 3.077061176300049, 3.189333438873291, 3.301605701446533, 3.4138779640197754]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 10.0, 19.0, 34.0, 46.0, 91.0, 163.0, 370.0, 752.0, 2299.0, 6714.0, 23156.0, 89616.0, 402289.0, 400073.0, 89881.0, 22710.0, 6522.0, 2100.0, 883.0, 384.0, 176.0, 101.0, 68.0, 28.0, 19.0, 15.0, 12.0, 2.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.812225341796875, -2.73187255859375, -2.651519775390625, -2.5711669921875, -2.490814208984375, -2.41046142578125, -2.330108642578125, -2.249755859375, -2.169403076171875, -2.08905029296875, -2.008697509765625, -1.9283447265625, -1.847991943359375, -1.76763916015625, -1.687286376953125, -1.60693359375, -1.526580810546875, -1.44622802734375, -1.365875244140625, -1.2855224609375, -1.205169677734375, -1.12481689453125, -1.044464111328125, -0.964111328125, -0.883758544921875, -0.80340576171875, -0.723052978515625, -0.6427001953125, -0.562347412109375, -0.48199462890625, -0.401641845703125, -0.3212890625, -0.240936279296875, -0.16058349609375, -0.080230712890625, 0.0001220703125, 0.080474853515625, 0.16082763671875, 0.241180419921875, 0.321533203125, 0.401885986328125, 0.48223876953125, 0.562591552734375, 0.6429443359375, 0.723297119140625, 0.80364990234375, 0.884002685546875, 0.96435546875, 1.044708251953125, 1.12506103515625, 1.205413818359375, 1.2857666015625, 1.366119384765625, 1.44647216796875, 1.526824951171875, 1.607177734375, 1.687530517578125, 1.76788330078125, 1.848236083984375, 1.9285888671875, 2.008941650390625, 2.08929443359375, 2.169647216796875, 2.25]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 7.0, 5.0, 8.0, 15.0, 11.0, 26.0, 29.0, 22.0, 33.0, 45.0, 42.0, 37.0, 61.0, 53.0, 62.0, 58.0, 68.0, 56.0, 61.0, 52.0, 42.0, 43.0, 36.0, 24.0, 25.0, 23.0, 20.0, 13.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.04296875, -5.8858642578125, -5.728759765625, -5.5716552734375, -5.41455078125, -5.2574462890625, -5.100341796875, -4.9432373046875, -4.7861328125, -4.6290283203125, -4.471923828125, -4.3148193359375, -4.15771484375, -4.0006103515625, -3.843505859375, -3.6864013671875, -3.529296875, -3.3721923828125, -3.215087890625, -3.0579833984375, -2.90087890625, -2.7437744140625, -2.586669921875, -2.4295654296875, -2.2724609375, -2.1153564453125, -1.958251953125, -1.8011474609375, -1.64404296875, -1.4869384765625, -1.329833984375, -1.1727294921875, -1.015625, -0.8585205078125, -0.701416015625, -0.5443115234375, -0.38720703125, -0.2301025390625, -0.072998046875, 0.0841064453125, 0.2412109375, 0.3983154296875, 0.555419921875, 0.7125244140625, 0.86962890625, 1.0267333984375, 1.183837890625, 1.3409423828125, 1.498046875, 1.6551513671875, 1.812255859375, 1.9693603515625, 2.12646484375, 2.2835693359375, 2.440673828125, 2.5977783203125, 2.7548828125, 2.9119873046875, 3.069091796875, 3.2261962890625, 3.38330078125, 3.5404052734375, 3.697509765625, 3.8546142578125, 4.01171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 7.0, 16.0, 6.0, 30.0, 18.0, 20.0, 23.0, 22.0, 41.0, 23.0, 39.0, 58.0, 83.0, 197.0, 1032.0, 291205.0, 753598.0, 1439.0, 233.0, 86.0, 48.0, 44.0, 38.0, 38.0, 25.0, 32.0, 16.0, 20.0, 15.0, 10.0, 11.0, 15.0, 6.0, 11.0, 1.0, 5.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.166015625, -15.69140625, -15.216796875, -14.7421875, -14.267578125, -13.79296875, -13.318359375, -12.84375, -12.369140625, -11.89453125, -11.419921875, -10.9453125, -10.470703125, -9.99609375, -9.521484375, -9.046875, -8.572265625, -8.09765625, -7.623046875, -7.1484375, -6.673828125, -6.19921875, -5.724609375, -5.25, -4.775390625, -4.30078125, -3.826171875, -3.3515625, -2.876953125, -2.40234375, -1.927734375, -1.453125, -0.978515625, -0.50390625, -0.029296875, 0.4453125, 0.919921875, 1.39453125, 1.869140625, 2.34375, 2.818359375, 3.29296875, 3.767578125, 4.2421875, 4.716796875, 5.19140625, 5.666015625, 6.140625, 6.615234375, 7.08984375, 7.564453125, 8.0390625, 8.513671875, 8.98828125, 9.462890625, 9.9375, 10.412109375, 10.88671875, 11.361328125, 11.8359375, 12.310546875, 12.78515625, 13.259765625, 13.734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 7.0, 10.0, 2.0, 3.0, 14.0, 13.0, 10.0, 26.0, 15.0, 33.0, 15.0, 37.0, 31.0, 36.0, 35.0, 41.0, 40.0, 46.0, 56.0, 37.0, 53.0, 57.0, 44.0, 46.0, 39.0, 29.0, 38.0, 35.0, 23.0, 30.0, 11.0, 25.0, 14.0, 10.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.734375, -4.601226806640625, -4.46807861328125, -4.334930419921875, -4.2017822265625, -4.068634033203125, -3.93548583984375, -3.802337646484375, -3.669189453125, -3.536041259765625, -3.40289306640625, -3.269744873046875, -3.1365966796875, -3.003448486328125, -2.87030029296875, -2.737152099609375, -2.60400390625, -2.470855712890625, -2.33770751953125, -2.204559326171875, -2.0714111328125, -1.938262939453125, -1.80511474609375, -1.671966552734375, -1.538818359375, -1.405670166015625, -1.27252197265625, -1.139373779296875, -1.0062255859375, -0.873077392578125, -0.73992919921875, -0.606781005859375, -0.4736328125, -0.340484619140625, -0.20733642578125, -0.074188232421875, 0.0589599609375, 0.192108154296875, 0.32525634765625, 0.458404541015625, 0.591552734375, 0.724700927734375, 0.85784912109375, 0.990997314453125, 1.1241455078125, 1.257293701171875, 1.39044189453125, 1.523590087890625, 1.65673828125, 1.789886474609375, 1.92303466796875, 2.056182861328125, 2.1893310546875, 2.322479248046875, 2.45562744140625, 2.588775634765625, 2.721923828125, 2.855072021484375, 2.98822021484375, 3.121368408203125, 3.2545166015625, 3.387664794921875, 3.52081298828125, 3.653961181640625, 3.787109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 15.0, 23.0, 21.0, 43.0, 72.0, 135.0, 345.0, 1568.0, 11131.0, 511364.0, 510368.0, 11083.0, 1574.0, 433.0, 151.0, 71.0, 51.0, 31.0, 13.0, 12.0, 9.0, 6.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.6953125, -2.622467041015625, -2.54962158203125, -2.476776123046875, -2.4039306640625, -2.331085205078125, -2.25823974609375, -2.185394287109375, -2.112548828125, -2.039703369140625, -1.96685791015625, -1.894012451171875, -1.8211669921875, -1.748321533203125, -1.67547607421875, -1.602630615234375, -1.52978515625, -1.456939697265625, -1.38409423828125, -1.311248779296875, -1.2384033203125, -1.165557861328125, -1.09271240234375, -1.019866943359375, -0.947021484375, -0.874176025390625, -0.80133056640625, -0.728485107421875, -0.6556396484375, -0.582794189453125, -0.50994873046875, -0.437103271484375, -0.3642578125, -0.291412353515625, -0.21856689453125, -0.145721435546875, -0.0728759765625, -3.0517578125e-05, 0.07281494140625, 0.145660400390625, 0.218505859375, 0.291351318359375, 0.36419677734375, 0.437042236328125, 0.5098876953125, 0.582733154296875, 0.65557861328125, 0.728424072265625, 0.80126953125, 0.874114990234375, 0.94696044921875, 1.019805908203125, 1.0926513671875, 1.165496826171875, 1.23834228515625, 1.311187744140625, 1.384033203125, 1.456878662109375, 1.52972412109375, 1.602569580078125, 1.6754150390625, 1.748260498046875, 1.82110595703125, 1.893951416015625, 1.966796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 7.0, 18.0, 19.0, 26.0, 47.0, 62.0, 72.0, 117.0, 119.0, 120.0, 87.0, 80.0, 54.0, 50.0, 30.0, 20.0, 23.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016820430755615234, -0.00016312859952449799, -0.00015805289149284363, -0.00015297718346118927, -0.0001479014754295349, -0.00014282576739788055, -0.0001377500593662262, -0.00013267435133457184, -0.00012759864330291748, -0.00012252293527126312, -0.00011744722723960876, -0.0001123715192079544, -0.00010729581117630005, -0.00010222010314464569, -9.714439511299133e-05, -9.206868708133698e-05, -8.699297904968262e-05, -8.191727101802826e-05, -7.68415629863739e-05, -7.176585495471954e-05, -6.669014692306519e-05, -6.161443889141083e-05, -5.653873085975647e-05, -5.146302282810211e-05, -4.6387314796447754e-05, -4.1311606764793396e-05, -3.623589873313904e-05, -3.116019070148468e-05, -2.6084482669830322e-05, -2.1008774638175964e-05, -1.5933066606521606e-05, -1.0857358574867249e-05, -5.781650543212891e-06, -7.059425115585327e-07, 4.369765520095825e-06, 9.445473551750183e-06, 1.4521181583404541e-05, 1.95968896150589e-05, 2.4672597646713257e-05, 2.9748305678367615e-05, 3.482401371002197e-05, 3.989972174167633e-05, 4.497542977333069e-05, 5.0051137804985046e-05, 5.5126845836639404e-05, 6.020255386829376e-05, 6.527826189994812e-05, 7.035396993160248e-05, 7.542967796325684e-05, 8.05053859949112e-05, 8.558109402656555e-05, 9.065680205821991e-05, 9.573251008987427e-05, 0.00010080821812152863, 0.00010588392615318298, 0.00011095963418483734, 0.0001160353422164917, 0.00012111105024814606, 0.00012618675827980042, 0.00013126246631145477, 0.00013633817434310913, 0.0001414138823747635, 0.00014648959040641785, 0.0001515652984380722, 0.00015664100646972656]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 11.0, 16.0, 20.0, 20.0, 33.0, 76.0, 113.0, 215.0, 424.0, 924.0, 2526.0, 9247.0, 59905.0, 533726.0, 389010.0, 40970.0, 7393.0, 2179.0, 833.0, 386.0, 204.0, 124.0, 55.0, 32.0, 21.0, 13.0, 12.0, 9.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.2900390625, -1.2519989013671875, -1.213958740234375, -1.1759185791015625, -1.13787841796875, -1.0998382568359375, -1.061798095703125, -1.0237579345703125, -0.9857177734375, -0.9476776123046875, -0.909637451171875, -0.8715972900390625, -0.83355712890625, -0.7955169677734375, -0.757476806640625, -0.7194366455078125, -0.681396484375, -0.6433563232421875, -0.605316162109375, -0.5672760009765625, -0.52923583984375, -0.4911956787109375, -0.453155517578125, -0.4151153564453125, -0.3770751953125, -0.3390350341796875, -0.300994873046875, -0.2629547119140625, -0.22491455078125, -0.1868743896484375, -0.148834228515625, -0.1107940673828125, -0.07275390625, -0.0347137451171875, 0.003326416015625, 0.0413665771484375, 0.07940673828125, 0.1174468994140625, 0.155487060546875, 0.1935272216796875, 0.2315673828125, 0.2696075439453125, 0.307647705078125, 0.3456878662109375, 0.38372802734375, 0.4217681884765625, 0.459808349609375, 0.4978485107421875, 0.535888671875, 0.5739288330078125, 0.611968994140625, 0.6500091552734375, 0.68804931640625, 0.7260894775390625, 0.764129638671875, 0.8021697998046875, 0.8402099609375, 0.8782501220703125, 0.916290283203125, 0.9543304443359375, 0.99237060546875, 1.0304107666015625, 1.068450927734375, 1.1064910888671875, 1.14453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 9.0, 13.0, 15.0, 20.0, 27.0, 35.0, 58.0, 81.0, 120.0, 118.0, 120.0, 113.0, 70.0, 51.0, 44.0, 27.0, 23.0, 7.0, 14.0, 4.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3740882873535156, -0.35779571533203125, -0.3415031433105469, -0.3252105712890625, -0.3089179992675781, -0.29262542724609375, -0.2763328552246094, -0.260040283203125, -0.24374771118164062, -0.22745513916015625, -0.21116256713867188, -0.1948699951171875, -0.17857742309570312, -0.16228485107421875, -0.14599227905273438, -0.12969970703125, -0.11340713500976562, -0.09711456298828125, -0.08082199096679688, -0.0645294189453125, -0.048236846923828125, -0.03194427490234375, -0.015651702880859375, 0.000640869140625, 0.016933441162109375, 0.03322601318359375, 0.049518585205078125, 0.0658111572265625, 0.08210372924804688, 0.09839630126953125, 0.11468887329101562, 0.1309814453125, 0.14727401733398438, 0.16356658935546875, 0.17985916137695312, 0.1961517333984375, 0.21244430541992188, 0.22873687744140625, 0.24502944946289062, 0.261322021484375, 0.2776145935058594, 0.29390716552734375, 0.3101997375488281, 0.3264923095703125, 0.3427848815917969, 0.35907745361328125, 0.3753700256347656, 0.39166259765625, 0.4079551696777344, 0.42424774169921875, 0.4405403137207031, 0.4568328857421875, 0.4731254577636719, 0.48941802978515625, 0.5057106018066406, 0.522003173828125, 0.5382957458496094, 0.5545883178710938, 0.5708808898925781, 0.5871734619140625, 0.6034660339355469, 0.6197586059570312, 0.6360511779785156, 0.65234375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 15.0, 32.0, 111.0, 174.0, 230.0, 205.0, 130.0, 59.0, 23.0, 10.0, 4.0, 3.0, 0.0, 1.0], "bins": [-25.567317962646484, -25.098392486572266, -24.629467010498047, -24.160541534423828, -23.69161605834961, -23.22269058227539, -22.753765106201172, -22.284839630126953, -21.815914154052734, -21.346988677978516, -20.878063201904297, -20.409137725830078, -19.94021224975586, -19.47128677368164, -19.002361297607422, -18.533435821533203, -18.064510345458984, -17.595584869384766, -17.126659393310547, -16.657733917236328, -16.18880844116211, -15.71988296508789, -15.250957489013672, -14.782032012939453, -14.31310749053955, -13.844182014465332, -13.375256538391113, -12.906331062316895, -12.437405586242676, -11.968480110168457, -11.499554634094238, -11.03062915802002, -10.561702728271484, -10.092777252197266, -9.623851776123047, -9.154926300048828, -8.68600082397461, -8.21707534790039, -7.748149871826172, -7.279224395751953, -6.810299873352051, -6.341374397277832, -5.872448921203613, -5.4035234451293945, -4.934597969055176, -4.465672492980957, -3.9967472553253174, -3.5278217792510986, -3.058896064758301, -2.589970588684082, -2.1210451126098633, -1.652119755744934, -1.1831942796707153, -0.7142689228057861, -0.24534344673156738, 0.22358202934265137, 0.6925075054168701, 1.1614329814910889, 1.6303584575653076, 2.0992836952209473, 2.568209171295166, 3.0371346473693848, 3.5060601234436035, 3.9749855995178223, 4.443911075592041]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 9.0, 12.0, 8.0, 14.0, 12.0, 18.0, 14.0, 18.0, 24.0, 28.0, 36.0, 28.0, 41.0, 37.0, 40.0, 42.0, 44.0, 39.0, 38.0, 48.0, 45.0, 37.0, 55.0, 36.0, 28.0, 36.0, 20.0, 31.0, 29.0, 26.0, 19.0, 15.0, 12.0, 11.0, 8.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-6.464783668518066, -6.28306770324707, -6.101352214813232, -5.919636249542236, -5.73792028427124, -5.556204795837402, -5.374488830566406, -5.19277286529541, -5.011057376861572, -4.829341411590576, -4.647625923156738, -4.465909957885742, -4.284193992614746, -4.102478504180908, -3.920762538909912, -3.739046812057495, -3.557330846786499, -3.375615119934082, -3.193899154663086, -3.012183427810669, -2.830467700958252, -2.648751735687256, -2.467036008834839, -2.285320281982422, -2.103604316711426, -1.9218884706497192, -1.7401727437973022, -1.5584568977355957, -1.3767411708831787, -1.1950253248214722, -1.0133094787597656, -0.8315937519073486, -0.6498780250549316, -0.4681622385978699, -0.2864464223384857, -0.10473060607910156, 0.0769851803779602, 0.258700966835022, 0.4404168128967285, 0.6221325397491455, 0.803848385810852, 0.9855641722679138, 1.1672799587249756, 1.3489958047866821, 1.5307116508483887, 1.7124273777008057, 1.8941432237625122, 2.0758590698242188, 2.2575747966766357, 2.4392905235290527, 2.621006488800049, 2.802722215652466, 2.984437942504883, 3.166153907775879, 3.347869634628296, 3.529585361480713, 3.711301326751709, 3.893017053604126, 4.074732780456543, 4.256448745727539, 4.438164710998535, 4.619880199432373, 4.801596164703369, 4.983311653137207, 5.165027618408203]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 7.0, 4.0, 8.0, 9.0, 11.0, 17.0, 18.0, 24.0, 30.0, 38.0, 72.0, 88.0, 146.0, 210.0, 356.0, 590.0, 1460.0, 3671.0, 12685.0, 58948.0, 346837.0, 1573494.0, 1685918.0, 413126.0, 72496.0, 16197.0, 4838.0, 1577.0, 658.0, 332.0, 141.0, 100.0, 60.0, 27.0, 25.0, 11.0, 14.0, 11.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.8046875, -3.68597412109375, -3.5672607421875, -3.44854736328125, -3.329833984375, -3.21112060546875, -3.0924072265625, -2.97369384765625, -2.85498046875, -2.73626708984375, -2.6175537109375, -2.49884033203125, -2.380126953125, -2.26141357421875, -2.1427001953125, -2.02398681640625, -1.9052734375, -1.78656005859375, -1.6678466796875, -1.54913330078125, -1.430419921875, -1.31170654296875, -1.1929931640625, -1.07427978515625, -0.95556640625, -0.83685302734375, -0.7181396484375, -0.59942626953125, -0.480712890625, -0.36199951171875, -0.2432861328125, -0.12457275390625, -0.005859375, 0.11285400390625, 0.2315673828125, 0.35028076171875, 0.468994140625, 0.58770751953125, 0.7064208984375, 0.82513427734375, 0.94384765625, 1.06256103515625, 1.1812744140625, 1.29998779296875, 1.418701171875, 1.53741455078125, 1.6561279296875, 1.77484130859375, 1.8935546875, 2.01226806640625, 2.1309814453125, 2.24969482421875, 2.368408203125, 2.48712158203125, 2.6058349609375, 2.72454833984375, 2.84326171875, 2.96197509765625, 3.0806884765625, 3.19940185546875, 3.318115234375, 3.43682861328125, 3.5555419921875, 3.67425537109375, 3.79296875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 7.0, 12.0, 12.0, 23.0, 38.0, 29.0, 36.0, 45.0, 43.0, 53.0, 52.0, 60.0, 62.0, 62.0, 63.0, 66.0, 58.0, 41.0, 42.0, 32.0, 30.0, 30.0, 29.0, 11.0, 20.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.4296875, -4.31591796875, -4.2021484375, -4.08837890625, -3.974609375, -3.86083984375, -3.7470703125, -3.63330078125, -3.51953125, -3.40576171875, -3.2919921875, -3.17822265625, -3.064453125, -2.95068359375, -2.8369140625, -2.72314453125, -2.609375, -2.49560546875, -2.3818359375, -2.26806640625, -2.154296875, -2.04052734375, -1.9267578125, -1.81298828125, -1.69921875, -1.58544921875, -1.4716796875, -1.35791015625, -1.244140625, -1.13037109375, -1.0166015625, -0.90283203125, -0.7890625, -0.67529296875, -0.5615234375, -0.44775390625, -0.333984375, -0.22021484375, -0.1064453125, 0.00732421875, 0.12109375, 0.23486328125, 0.3486328125, 0.46240234375, 0.576171875, 0.68994140625, 0.8037109375, 0.91748046875, 1.03125, 1.14501953125, 1.2587890625, 1.37255859375, 1.486328125, 1.60009765625, 1.7138671875, 1.82763671875, 1.94140625, 2.05517578125, 2.1689453125, 2.28271484375, 2.396484375, 2.51025390625, 2.6240234375, 2.73779296875, 2.8515625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 12.0, 12.0, 32.0, 39.0, 60.0, 117.0, 274.0, 783.0, 3179.0, 27585.0, 1230181.0, 2863241.0, 61169.0, 5464.0, 1252.0, 422.0, 188.0, 99.0, 53.0, 32.0, 21.0, 21.0, 12.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.26824951171875, -5.0404052734375, -4.81256103515625, -4.584716796875, -4.35687255859375, -4.1290283203125, -3.90118408203125, -3.67333984375, -3.44549560546875, -3.2176513671875, -2.98980712890625, -2.761962890625, -2.53411865234375, -2.3062744140625, -2.07843017578125, -1.8505859375, -1.62274169921875, -1.3948974609375, -1.16705322265625, -0.939208984375, -0.71136474609375, -0.4835205078125, -0.25567626953125, -0.02783203125, 0.20001220703125, 0.4278564453125, 0.65570068359375, 0.883544921875, 1.11138916015625, 1.3392333984375, 1.56707763671875, 1.794921875, 2.02276611328125, 2.2506103515625, 2.47845458984375, 2.706298828125, 2.93414306640625, 3.1619873046875, 3.38983154296875, 3.61767578125, 3.84552001953125, 4.0733642578125, 4.30120849609375, 4.529052734375, 4.75689697265625, 4.9847412109375, 5.21258544921875, 5.4404296875, 5.66827392578125, 5.8961181640625, 6.12396240234375, 6.351806640625, 6.57965087890625, 6.8074951171875, 7.03533935546875, 7.26318359375, 7.49102783203125, 7.7188720703125, 7.94671630859375, 8.174560546875, 8.40240478515625, 8.6302490234375, 8.85809326171875, 9.0859375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 6.0, 15.0, 26.0, 32.0, 71.0, 102.0, 163.0, 245.0, 425.0, 547.0, 685.0, 638.0, 450.0, 264.0, 144.0, 98.0, 56.0, 35.0, 19.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21484375, -2.15740966796875, -2.0999755859375, -2.04254150390625, -1.985107421875, -1.92767333984375, -1.8702392578125, -1.81280517578125, -1.75537109375, -1.69793701171875, -1.6405029296875, -1.58306884765625, -1.525634765625, -1.46820068359375, -1.4107666015625, -1.35333251953125, -1.2958984375, -1.23846435546875, -1.1810302734375, -1.12359619140625, -1.066162109375, -1.00872802734375, -0.9512939453125, -0.89385986328125, -0.83642578125, -0.77899169921875, -0.7215576171875, -0.66412353515625, -0.606689453125, -0.54925537109375, -0.4918212890625, -0.43438720703125, -0.376953125, -0.31951904296875, -0.2620849609375, -0.20465087890625, -0.147216796875, -0.08978271484375, -0.0323486328125, 0.02508544921875, 0.08251953125, 0.13995361328125, 0.1973876953125, 0.25482177734375, 0.312255859375, 0.36968994140625, 0.4271240234375, 0.48455810546875, 0.5419921875, 0.59942626953125, 0.6568603515625, 0.71429443359375, 0.771728515625, 0.82916259765625, 0.8865966796875, 0.94403076171875, 1.00146484375, 1.05889892578125, 1.1163330078125, 1.17376708984375, 1.231201171875, 1.28863525390625, 1.3460693359375, 1.40350341796875, 1.4609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 15.0, 18.0, 29.0, 58.0, 64.0, 77.0, 94.0, 108.0, 112.0, 113.0, 84.0, 72.0, 53.0, 39.0, 16.0, 15.0, 12.0, 8.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.956422805786133, -5.767917633056641, -5.579412460327148, -5.390907287597656, -5.202401638031006, -5.013896465301514, -4.8253912925720215, -4.636886119842529, -4.448380470275879, -4.259875297546387, -4.0713701248168945, -3.8828647136688232, -3.694359302520752, -3.5058541297912598, -3.3173489570617676, -3.1288437843322754, -2.940338611602783, -2.751833438873291, -2.5633280277252197, -2.3748228549957275, -2.1863174438476562, -1.997812271118164, -1.8093070983886719, -1.6208018064498901, -1.4322965145111084, -1.2437912225723267, -1.055285930633545, -0.8667807579040527, -0.678275465965271, -0.48977017402648926, -0.30126500129699707, -0.11275970935821533, 0.0757455825805664, 0.26425084471702576, 0.4527561068534851, 0.6412613391876221, 0.8297666311264038, 1.0182719230651855, 1.2067770957946777, 1.3952823877334595, 1.5837876796722412, 1.772292971611023, 1.9607982635498047, 2.149303436279297, 2.337808609008789, 2.5263140201568604, 2.7148191928863525, 2.903324604034424, 3.091829776763916, 3.280334949493408, 3.4688403606414795, 3.6573455333709717, 3.845850944519043, 4.034356117248535, 4.222861289978027, 4.4113664627075195, 4.599871635437012, 4.788376808166504, 4.976881980895996, 5.165387153625488, 5.353892803192139, 5.542397975921631, 5.730903148651123, 5.919408321380615, 6.107913970947266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 2.0, 16.0, 10.0, 16.0, 17.0, 15.0, 26.0, 29.0, 24.0, 28.0, 43.0, 44.0, 39.0, 48.0, 54.0, 49.0, 56.0, 59.0, 53.0, 49.0, 47.0, 43.0, 41.0, 42.0, 29.0, 29.0, 18.0, 15.0, 8.0, 9.0, 10.0, 4.0, 9.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.940107822418213, -2.830690383911133, -2.7212727069854736, -2.6118552684783936, -2.5024375915527344, -2.3930201530456543, -2.283602476119995, -2.174185037612915, -2.064767360687256, -1.9553498029708862, -1.8459322452545166, -1.736514687538147, -1.6270971298217773, -1.5176796913146973, -1.408262014389038, -1.298844575881958, -1.1894270181655884, -1.0800094604492188, -0.9705919027328491, -0.8611743450164795, -0.7517567873001099, -0.642339289188385, -0.5329217314720154, -0.42350417375564575, -0.3140866160392761, -0.2046690583229065, -0.09525151550769806, 0.014166027307510376, 0.12358358502388, 0.23300111293792725, 0.3424186706542969, 0.4518362283706665, 0.5612537860870361, 0.6706713438034058, 0.7800889015197754, 0.889506459236145, 0.9989240169525146, 1.1083414554595947, 1.217759132385254, 1.327176570892334, 1.4365942478179932, 1.5460118055343628, 1.6554293632507324, 1.764846920967102, 1.8742644786834717, 1.9836819171905518, 2.093099594116211, 2.202517032623291, 2.311934471130371, 2.421351909637451, 2.5307695865631104, 2.6401870250701904, 2.7496047019958496, 2.8590221405029297, 2.968439817428589, 3.077857255935669, 3.187274932861328, 3.296692371368408, 3.4061100482940674, 3.5155274868011475, 3.6249451637268066, 3.7343626022338867, 3.843780279159546, 3.953197717666626, 4.062615394592285]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 7.0, 4.0, 10.0, 19.0, 22.0, 34.0, 54.0, 73.0, 144.0, 191.0, 383.0, 735.0, 1536.0, 4113.0, 14228.0, 77519.0, 475158.0, 396329.0, 59595.0, 11853.0, 3564.0, 1467.0, 646.0, 339.0, 203.0, 119.0, 63.0, 40.0, 36.0, 16.0, 19.0, 12.0, 10.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89404296875, -0.8641738891601562, -0.8343048095703125, -0.8044357299804688, -0.774566650390625, -0.7446975708007812, -0.7148284912109375, -0.6849594116210938, -0.65509033203125, -0.6252212524414062, -0.5953521728515625, -0.5654830932617188, -0.535614013671875, -0.5057449340820312, -0.4758758544921875, -0.44600677490234375, -0.4161376953125, -0.38626861572265625, -0.3563995361328125, -0.32653045654296875, -0.296661376953125, -0.26679229736328125, -0.2369232177734375, -0.20705413818359375, -0.17718505859375, -0.14731597900390625, -0.1174468994140625, -0.08757781982421875, -0.057708740234375, -0.02783966064453125, 0.0020294189453125, 0.03189849853515625, 0.061767578125, 0.09163665771484375, 0.1215057373046875, 0.15137481689453125, 0.181243896484375, 0.21111297607421875, 0.2409820556640625, 0.27085113525390625, 0.30072021484375, 0.33058929443359375, 0.3604583740234375, 0.39032745361328125, 0.420196533203125, 0.45006561279296875, 0.4799346923828125, 0.5098037719726562, 0.5396728515625, 0.5695419311523438, 0.5994110107421875, 0.6292800903320312, 0.659149169921875, 0.6890182495117188, 0.7188873291015625, 0.7487564086914062, 0.77862548828125, 0.8084945678710938, 0.8383636474609375, 0.8682327270507812, 0.898101806640625, 0.9279708862304688, 0.9578399658203125, 0.9877090454101562, 1.017578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 6.0, 14.0, 13.0, 17.0, 17.0, 29.0, 23.0, 26.0, 40.0, 40.0, 55.0, 70.0, 55.0, 62.0, 69.0, 66.0, 48.0, 66.0, 56.0, 44.0, 33.0, 38.0, 25.0, 14.0, 17.0, 16.0, 7.0, 12.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.305694580078125, -2.22662353515625, -2.147552490234375, -2.0684814453125, -1.989410400390625, -1.91033935546875, -1.831268310546875, -1.752197265625, -1.673126220703125, -1.59405517578125, -1.514984130859375, -1.4359130859375, -1.356842041015625, -1.27777099609375, -1.198699951171875, -1.11962890625, -1.040557861328125, -0.96148681640625, -0.882415771484375, -0.8033447265625, -0.724273681640625, -0.64520263671875, -0.566131591796875, -0.487060546875, -0.407989501953125, -0.32891845703125, -0.249847412109375, -0.1707763671875, -0.091705322265625, -0.01263427734375, 0.066436767578125, 0.1455078125, 0.224578857421875, 0.30364990234375, 0.382720947265625, 0.4617919921875, 0.540863037109375, 0.61993408203125, 0.699005126953125, 0.778076171875, 0.857147216796875, 0.93621826171875, 1.015289306640625, 1.0943603515625, 1.173431396484375, 1.25250244140625, 1.331573486328125, 1.41064453125, 1.489715576171875, 1.56878662109375, 1.647857666015625, 1.7269287109375, 1.805999755859375, 1.88507080078125, 1.964141845703125, 2.043212890625, 2.122283935546875, 2.20135498046875, 2.280426025390625, 2.3594970703125, 2.438568115234375, 2.51763916015625, 2.596710205078125, 2.67578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 3.0, 16.0, 13.0, 20.0, 36.0, 43.0, 64.0, 85.0, 134.0, 186.0, 292.0, 449.0, 660.0, 1018.0, 1697.0, 2762.0, 4760.0, 8155.0, 14503.0, 25756.0, 46362.0, 80455.0, 133482.0, 186912.0, 193619.0, 142246.0, 87785.0, 50552.0, 28363.0, 15705.0, 9046.0, 5199.0, 3043.0, 1774.0, 1157.0, 724.0, 474.0, 314.0, 196.0, 148.0, 93.0, 69.0, 50.0, 42.0, 28.0, 19.0, 18.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1903076171875, -0.1835308074951172, -0.17675399780273438, -0.16997718811035156, -0.16320037841796875, -0.15642356872558594, -0.14964675903320312, -0.1428699493408203, -0.1360931396484375, -0.1293163299560547, -0.12253952026367188, -0.11576271057128906, -0.10898590087890625, -0.10220909118652344, -0.09543228149414062, -0.08865547180175781, -0.081878662109375, -0.07510185241699219, -0.06832504272460938, -0.06154823303222656, -0.05477142333984375, -0.04799461364746094, -0.041217803955078125, -0.03444099426269531, -0.0276641845703125, -0.020887374877929688, -0.014110565185546875, -0.0073337554931640625, -0.00055694580078125, 0.0062198638916015625, 0.012996673583984375, 0.019773483276367188, 0.02655029296875, 0.03332710266113281, 0.040103912353515625, 0.04688072204589844, 0.05365753173828125, 0.06043434143066406, 0.06721115112304688, 0.07398796081542969, 0.0807647705078125, 0.08754158020019531, 0.09431838989257812, 0.10109519958496094, 0.10787200927734375, 0.11464881896972656, 0.12142562866210938, 0.1282024383544922, 0.134979248046875, 0.1417560577392578, 0.14853286743164062, 0.15530967712402344, 0.16208648681640625, 0.16886329650878906, 0.17564010620117188, 0.1824169158935547, 0.1891937255859375, 0.1959705352783203, 0.20274734497070312, 0.20952415466308594, 0.21630096435546875, 0.22307777404785156, 0.22985458374023438, 0.2366313934326172, 0.243408203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 3.0, 7.0, 13.0, 13.0, 8.0, 22.0, 24.0, 25.0, 36.0, 34.0, 55.0, 52.0, 48.0, 45.0, 49.0, 57.0, 52.0, 46.0, 61.0, 61.0, 39.0, 46.0, 30.0, 38.0, 21.0, 24.0, 19.0, 13.0, 11.0, 15.0, 12.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.3895263671875, -3.259521484375, -3.1295166015625, -2.99951171875, -2.8695068359375, -2.739501953125, -2.6094970703125, -2.4794921875, -2.3494873046875, -2.219482421875, -2.0894775390625, -1.95947265625, -1.8294677734375, -1.699462890625, -1.5694580078125, -1.439453125, -1.3094482421875, -1.179443359375, -1.0494384765625, -0.91943359375, -0.7894287109375, -0.659423828125, -0.5294189453125, -0.3994140625, -0.2694091796875, -0.139404296875, -0.0093994140625, 0.12060546875, 0.2506103515625, 0.380615234375, 0.5106201171875, 0.640625, 0.7706298828125, 0.900634765625, 1.0306396484375, 1.16064453125, 1.2906494140625, 1.420654296875, 1.5506591796875, 1.6806640625, 1.8106689453125, 1.940673828125, 2.0706787109375, 2.20068359375, 2.3306884765625, 2.460693359375, 2.5906982421875, 2.720703125, 2.8507080078125, 2.980712890625, 3.1107177734375, 3.24072265625, 3.3707275390625, 3.500732421875, 3.6307373046875, 3.7607421875, 3.8907470703125, 4.020751953125, 4.1507568359375, 4.28076171875, 4.4107666015625, 4.540771484375, 4.6707763671875, 4.80078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 8.0, 2.0, 8.0, 17.0, 17.0, 22.0, 34.0, 53.0, 74.0, 101.0, 128.0, 241.0, 444.0, 1074.0, 2435.0, 7301.0, 25680.0, 109352.0, 388913.0, 373767.0, 103080.0, 24270.0, 6992.0, 2409.0, 970.0, 462.0, 246.0, 156.0, 95.0, 58.0, 35.0, 30.0, 30.0, 11.0, 11.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053436279296875, -0.051592350006103516, -0.04974842071533203, -0.04790449142456055, -0.04606056213378906, -0.04421663284301758, -0.042372703552246094, -0.04052877426147461, -0.038684844970703125, -0.03684091567993164, -0.034996986389160156, -0.03315305709838867, -0.03130912780761719, -0.029465198516845703, -0.02762126922607422, -0.025777339935302734, -0.02393341064453125, -0.022089481353759766, -0.02024555206298828, -0.018401622772216797, -0.016557693481445312, -0.014713764190673828, -0.012869834899902344, -0.01102590560913086, -0.009181976318359375, -0.007338047027587891, -0.005494117736816406, -0.003650188446044922, -0.0018062591552734375, 3.7670135498046875e-05, 0.0018815994262695312, 0.0037255287170410156, 0.0055694580078125, 0.007413387298583984, 0.009257316589355469, 0.011101245880126953, 0.012945175170898438, 0.014789104461669922, 0.016633033752441406, 0.01847696304321289, 0.020320892333984375, 0.02216482162475586, 0.024008750915527344, 0.025852680206298828, 0.027696609497070312, 0.029540538787841797, 0.03138446807861328, 0.033228397369384766, 0.03507232666015625, 0.036916255950927734, 0.03876018524169922, 0.0406041145324707, 0.04244804382324219, 0.04429197311401367, 0.046135902404785156, 0.04797983169555664, 0.049823760986328125, 0.05166769027709961, 0.053511619567871094, 0.05535554885864258, 0.05719947814941406, 0.05904340744018555, 0.06088733673095703, 0.06273126602172852, 0.0645751953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 6.0, 6.0, 14.0, 13.0, 16.0, 19.0, 33.0, 28.0, 33.0, 59.0, 51.0, 79.0, 74.0, 79.0, 96.0, 76.0, 69.0, 55.0, 38.0, 37.0, 27.0, 23.0, 10.0, 13.0, 8.0, 8.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8564205169677734e-05, -3.7445686757564545e-05, -3.6327168345451355e-05, -3.5208649933338165e-05, -3.4090131521224976e-05, -3.2971613109111786e-05, -3.1853094696998596e-05, -3.0734576284885406e-05, -2.9616057872772217e-05, -2.8497539460659027e-05, -2.7379021048545837e-05, -2.6260502636432648e-05, -2.5141984224319458e-05, -2.402346581220627e-05, -2.290494740009308e-05, -2.178642898797989e-05, -2.06679105758667e-05, -1.954939216375351e-05, -1.843087375164032e-05, -1.731235533952713e-05, -1.619383692741394e-05, -1.507531851530075e-05, -1.3956800103187561e-05, -1.2838281691074371e-05, -1.1719763278961182e-05, -1.0601244866847992e-05, -9.482726454734802e-06, -8.364208042621613e-06, -7.245689630508423e-06, -6.127171218395233e-06, -5.0086528062820435e-06, -3.890134394168854e-06, -2.771615982055664e-06, -1.6530975699424744e-06, -5.345791578292847e-07, 5.83939254283905e-07, 1.7024576663970947e-06, 2.8209760785102844e-06, 3.939494490623474e-06, 5.058012902736664e-06, 6.1765313148498535e-06, 7.295049726963043e-06, 8.413568139076233e-06, 9.532086551189423e-06, 1.0650604963302612e-05, 1.1769123375415802e-05, 1.2887641787528992e-05, 1.4006160199642181e-05, 1.5124678611755371e-05, 1.624319702386856e-05, 1.736171543598175e-05, 1.848023384809494e-05, 1.959875226020813e-05, 2.071727067232132e-05, 2.183578908443451e-05, 2.29543074965477e-05, 2.407282590866089e-05, 2.519134432077408e-05, 2.6309862732887268e-05, 2.7428381145000458e-05, 2.8546899557113647e-05, 2.9665417969226837e-05, 3.078393638134003e-05, 3.1902454793453217e-05, 3.3020973205566406e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 7.0, 8.0, 9.0, 26.0, 15.0, 46.0, 73.0, 121.0, 301.0, 567.0, 1286.0, 3625.0, 12683.0, 51074.0, 218736.0, 473928.0, 217270.0, 50340.0, 12302.0, 3627.0, 1362.0, 550.0, 266.0, 137.0, 66.0, 36.0, 18.0, 24.0, 7.0, 11.0, 4.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053253173828125, -0.05138444900512695, -0.049515724182128906, -0.04764699935913086, -0.04577827453613281, -0.043909549713134766, -0.04204082489013672, -0.04017210006713867, -0.038303375244140625, -0.03643465042114258, -0.03456592559814453, -0.032697200775146484, -0.030828475952148438, -0.02895975112915039, -0.027091026306152344, -0.025222301483154297, -0.02335357666015625, -0.021484851837158203, -0.019616127014160156, -0.01774740219116211, -0.015878677368164062, -0.014009952545166016, -0.012141227722167969, -0.010272502899169922, -0.008403778076171875, -0.006535053253173828, -0.004666328430175781, -0.0027976036071777344, -0.0009288787841796875, 0.0009398460388183594, 0.0028085708618164062, 0.004677295684814453, 0.0065460205078125, 0.008414745330810547, 0.010283470153808594, 0.01215219497680664, 0.014020919799804688, 0.015889644622802734, 0.01775836944580078, 0.019627094268798828, 0.021495819091796875, 0.023364543914794922, 0.02523326873779297, 0.027101993560791016, 0.028970718383789062, 0.03083944320678711, 0.032708168029785156, 0.0345768928527832, 0.03644561767578125, 0.0383143424987793, 0.040183067321777344, 0.04205179214477539, 0.04392051696777344, 0.045789241790771484, 0.04765796661376953, 0.04952669143676758, 0.051395416259765625, 0.05326414108276367, 0.05513286590576172, 0.057001590728759766, 0.05887031555175781, 0.06073904037475586, 0.0626077651977539, 0.06447649002075195, 0.06634521484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 13.0, 15.0, 17.0, 29.0, 49.0, 41.0, 71.0, 78.0, 130.0, 110.0, 94.0, 75.0, 69.0, 55.0, 41.0, 30.0, 27.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020660400390625, -0.019962310791015625, -0.01926422119140625, -0.018566131591796875, -0.0178680419921875, -0.017169952392578125, -0.01647186279296875, -0.015773773193359375, -0.01507568359375, -0.014377593994140625, -0.01367950439453125, -0.012981414794921875, -0.0122833251953125, -0.011585235595703125, -0.01088714599609375, -0.010189056396484375, -0.009490966796875, -0.008792877197265625, -0.00809478759765625, -0.007396697998046875, -0.0066986083984375, -0.006000518798828125, -0.00530242919921875, -0.004604339599609375, -0.00390625, -0.003208160400390625, -0.00251007080078125, -0.001811981201171875, -0.0011138916015625, -0.000415802001953125, 0.00028228759765625, 0.000980377197265625, 0.001678466796875, 0.002376556396484375, 0.00307464599609375, 0.003772735595703125, 0.0044708251953125, 0.005168914794921875, 0.00586700439453125, 0.006565093994140625, 0.00726318359375, 0.007961273193359375, 0.00865936279296875, 0.009357452392578125, 0.0100555419921875, 0.010753631591796875, 0.01145172119140625, 0.012149810791015625, 0.012847900390625, 0.013545989990234375, 0.01424407958984375, 0.014942169189453125, 0.0156402587890625, 0.016338348388671875, 0.01703643798828125, 0.017734527587890625, 0.0184326171875, 0.019130706787109375, 0.01982879638671875, 0.020526885986328125, 0.0212249755859375, 0.021923065185546875, 0.02262115478515625, 0.023319244384765625, 0.024017333984375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 13.0, 50.0, 180.0, 310.0, 290.0, 115.0, 41.0, 8.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.463403701782227, -4.141867637634277, -3.820331573486328, -3.498795509338379, -3.1772594451904297, -2.8557233810424805, -2.5341875553131104, -2.212651491165161, -1.891115427017212, -1.5695793628692627, -1.2480432987213135, -0.9265073537826538, -0.6049712896347046, -0.28343522548675537, 0.0381007194519043, 0.3596367835998535, 0.6811728477478027, 1.002708911895752, 1.3242449760437012, 1.6457809209823608, 1.96731698513031, 2.288853168487549, 2.610388994216919, 2.931925058364868, 3.2534611225128174, 3.5749971866607666, 3.896533250808716, 4.218069076538086, 4.539605140686035, 4.861141204833984, 5.182677268981934, 5.504213333129883, 5.825749397277832, 6.147285461425781, 6.4688215255737305, 6.79035758972168, 7.111893653869629, 7.433429718017578, 7.754965782165527, 8.076501846313477, 8.398037910461426, 8.719573974609375, 9.041110038757324, 9.362646102905273, 9.684182167053223, 10.005718231201172, 10.327254295349121, 10.64879035949707, 10.970325469970703, 11.291861534118652, 11.613397598266602, 11.93493366241455, 12.2564697265625, 12.57800579071045, 12.899541854858398, 13.221077919006348, 13.542613983154297, 13.864150047302246, 14.185686111450195, 14.507222175598145, 14.828758239746094, 15.150294303894043, 15.471830368041992, 15.793366432189941, 16.11490249633789]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 18.0, 22.0, 19.0, 30.0, 34.0, 26.0, 48.0, 53.0, 49.0, 52.0, 67.0, 75.0, 68.0, 70.0, 66.0, 46.0, 56.0, 48.0, 34.0, 31.0, 16.0, 11.0, 11.0, 7.0, 6.0, 12.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314805507659912, -2.233933687210083, -2.153061866760254, -2.072190046310425, -1.9913182258605957, -1.9104464054107666, -1.829574704170227, -1.748702883720398, -1.6678310632705688, -1.5869592428207397, -1.5060874223709106, -1.4252156019210815, -1.344343900680542, -1.263472080230713, -1.1826002597808838, -1.1017284393310547, -1.0208566188812256, -0.9399847984313965, -0.8591129779815674, -0.7782412171363831, -0.697369396686554, -0.6164975762367249, -0.5356258153915405, -0.4547539949417114, -0.3738821744918823, -0.2930103540420532, -0.2121385633945465, -0.1312667578458786, -0.05039495229721069, 0.030476868152618408, 0.11134865880012512, 0.19222044944763184, 0.27309250831604004, 0.35396432876586914, 0.43483611941337585, 0.5157079100608826, 0.5965797305107117, 0.6774515509605408, 0.7583233118057251, 0.8391951322555542, 0.9200669527053833, 1.0009387731552124, 1.0818105936050415, 1.1626824140548706, 1.2435541152954102, 1.3244259357452393, 1.4052977561950684, 1.4861695766448975, 1.5670413970947266, 1.6479132175445557, 1.7287850379943848, 1.8096568584442139, 1.890528678894043, 1.971400499343872, 2.052272319793701, 2.133143901824951, 2.2140159606933594, 2.2948877811431885, 2.3757596015930176, 2.4566314220428467, 2.537503242492676, 2.618375062942505, 2.699246883392334, 2.780118465423584, 2.860990285873413]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 14.0, 11.0, 35.0, 29.0, 64.0, 86.0, 162.0, 301.0, 536.0, 1066.0, 2165.0, 4576.0, 10290.0, 24902.0, 58125.0, 132819.0, 246826.0, 272102.0, 163721.0, 74689.0, 31584.0, 13204.0, 5693.0, 2639.0, 1374.0, 668.0, 369.0, 180.0, 115.0, 73.0, 38.0, 34.0, 11.0, 17.0, 8.0, 2.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.861328125, -1.8098297119140625, -1.758331298828125, -1.7068328857421875, -1.65533447265625, -1.6038360595703125, -1.552337646484375, -1.5008392333984375, -1.4493408203125, -1.3978424072265625, -1.346343994140625, -1.2948455810546875, -1.24334716796875, -1.1918487548828125, -1.140350341796875, -1.0888519287109375, -1.037353515625, -0.9858551025390625, -0.934356689453125, -0.8828582763671875, -0.83135986328125, -0.7798614501953125, -0.728363037109375, -0.6768646240234375, -0.6253662109375, -0.5738677978515625, -0.522369384765625, -0.4708709716796875, -0.41937255859375, -0.3678741455078125, -0.316375732421875, -0.2648773193359375, -0.21337890625, -0.1618804931640625, -0.110382080078125, -0.0588836669921875, -0.00738525390625, 0.0441131591796875, 0.095611572265625, 0.1471099853515625, 0.1986083984375, 0.2501068115234375, 0.301605224609375, 0.3531036376953125, 0.40460205078125, 0.4561004638671875, 0.507598876953125, 0.5590972900390625, 0.610595703125, 0.6620941162109375, 0.713592529296875, 0.7650909423828125, 0.81658935546875, 0.8680877685546875, 0.919586181640625, 0.9710845947265625, 1.0225830078125, 1.0740814208984375, 1.125579833984375, 1.1770782470703125, 1.22857666015625, 1.2800750732421875, 1.331573486328125, 1.3830718994140625, 1.4345703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 19.0, 16.0, 21.0, 25.0, 30.0, 43.0, 51.0, 47.0, 48.0, 58.0, 83.0, 70.0, 70.0, 68.0, 50.0, 68.0, 55.0, 34.0, 33.0, 20.0, 20.0, 8.0, 9.0, 8.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.83984375, -3.6943359375, -3.548828125, -3.4033203125, -3.2578125, -3.1123046875, -2.966796875, -2.8212890625, -2.67578125, -2.5302734375, -2.384765625, -2.2392578125, -2.09375, -1.9482421875, -1.802734375, -1.6572265625, -1.51171875, -1.3662109375, -1.220703125, -1.0751953125, -0.9296875, -0.7841796875, -0.638671875, -0.4931640625, -0.34765625, -0.2021484375, -0.056640625, 0.0888671875, 0.234375, 0.3798828125, 0.525390625, 0.6708984375, 0.81640625, 0.9619140625, 1.107421875, 1.2529296875, 1.3984375, 1.5439453125, 1.689453125, 1.8349609375, 1.98046875, 2.1259765625, 2.271484375, 2.4169921875, 2.5625, 2.7080078125, 2.853515625, 2.9990234375, 3.14453125, 3.2900390625, 3.435546875, 3.5810546875, 3.7265625, 3.8720703125, 4.017578125, 4.1630859375, 4.30859375, 4.4541015625, 4.599609375, 4.7451171875, 4.890625, 5.0361328125, 5.181640625, 5.3271484375, 5.47265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 7.0, 10.0, 6.0, 5.0, 12.0, 14.0, 22.0, 23.0, 29.0, 23.0, 39.0, 39.0, 47.0, 73.0, 126.0, 210.0, 466.0, 3136.0, 277323.0, 755188.0, 10210.0, 700.0, 255.0, 138.0, 90.0, 51.0, 46.0, 31.0, 41.0, 21.0, 18.0, 14.0, 20.0, 16.0, 22.0, 9.0, 11.0, 6.0, 3.0, 6.0, 3.0, 4.0, 5.0, 2.0, 8.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.890625, -8.6141357421875, -8.337646484375, -8.0611572265625, -7.78466796875, -7.5081787109375, -7.231689453125, -6.9552001953125, -6.6787109375, -6.4022216796875, -6.125732421875, -5.8492431640625, -5.57275390625, -5.2962646484375, -5.019775390625, -4.7432861328125, -4.466796875, -4.1903076171875, -3.913818359375, -3.6373291015625, -3.36083984375, -3.0843505859375, -2.807861328125, -2.5313720703125, -2.2548828125, -1.9783935546875, -1.701904296875, -1.4254150390625, -1.14892578125, -0.8724365234375, -0.595947265625, -0.3194580078125, -0.04296875, 0.2335205078125, 0.510009765625, 0.7864990234375, 1.06298828125, 1.3394775390625, 1.615966796875, 1.8924560546875, 2.1689453125, 2.4454345703125, 2.721923828125, 2.9984130859375, 3.27490234375, 3.5513916015625, 3.827880859375, 4.1043701171875, 4.380859375, 4.6573486328125, 4.933837890625, 5.2103271484375, 5.48681640625, 5.7633056640625, 6.039794921875, 6.3162841796875, 6.5927734375, 6.8692626953125, 7.145751953125, 7.4222412109375, 7.69873046875, 7.9752197265625, 8.251708984375, 8.5281982421875, 8.8046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 9.0, 8.0, 9.0, 10.0, 13.0, 20.0, 20.0, 24.0, 25.0, 21.0, 21.0, 38.0, 41.0, 43.0, 33.0, 35.0, 41.0, 43.0, 46.0, 47.0, 44.0, 36.0, 33.0, 35.0, 34.0, 30.0, 39.0, 35.0, 31.0, 19.0, 16.0, 17.0, 12.0, 13.0, 11.0, 7.0, 4.0, 6.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.36328125, -3.25921630859375, -3.1551513671875, -3.05108642578125, -2.947021484375, -2.84295654296875, -2.7388916015625, -2.63482666015625, -2.53076171875, -2.42669677734375, -2.3226318359375, -2.21856689453125, -2.114501953125, -2.01043701171875, -1.9063720703125, -1.80230712890625, -1.6982421875, -1.59417724609375, -1.4901123046875, -1.38604736328125, -1.281982421875, -1.17791748046875, -1.0738525390625, -0.96978759765625, -0.86572265625, -0.76165771484375, -0.6575927734375, -0.55352783203125, -0.449462890625, -0.34539794921875, -0.2413330078125, -0.13726806640625, -0.033203125, 0.07086181640625, 0.1749267578125, 0.27899169921875, 0.383056640625, 0.48712158203125, 0.5911865234375, 0.69525146484375, 0.79931640625, 0.90338134765625, 1.0074462890625, 1.11151123046875, 1.215576171875, 1.31964111328125, 1.4237060546875, 1.52777099609375, 1.6318359375, 1.73590087890625, 1.8399658203125, 1.94403076171875, 2.048095703125, 2.15216064453125, 2.2562255859375, 2.36029052734375, 2.46435546875, 2.56842041015625, 2.6724853515625, 2.77655029296875, 2.880615234375, 2.98468017578125, 3.0887451171875, 3.19281005859375, 3.296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 5.0, 8.0, 17.0, 45.0, 81.0, 190.0, 601.0, 2565.0, 27000.0, 860918.0, 149886.0, 5636.0, 1020.0, 297.0, 124.0, 68.0, 34.0, 6.0, 7.0, 8.0, 11.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.77734375, -2.6949462890625, -2.612548828125, -2.5301513671875, -2.44775390625, -2.3653564453125, -2.282958984375, -2.2005615234375, -2.1181640625, -2.0357666015625, -1.953369140625, -1.8709716796875, -1.78857421875, -1.7061767578125, -1.623779296875, -1.5413818359375, -1.458984375, -1.3765869140625, -1.294189453125, -1.2117919921875, -1.12939453125, -1.0469970703125, -0.964599609375, -0.8822021484375, -0.7998046875, -0.7174072265625, -0.635009765625, -0.5526123046875, -0.47021484375, -0.3878173828125, -0.305419921875, -0.2230224609375, -0.140625, -0.0582275390625, 0.024169921875, 0.1065673828125, 0.18896484375, 0.2713623046875, 0.353759765625, 0.4361572265625, 0.5185546875, 0.6009521484375, 0.683349609375, 0.7657470703125, 0.84814453125, 0.9305419921875, 1.012939453125, 1.0953369140625, 1.177734375, 1.2601318359375, 1.342529296875, 1.4249267578125, 1.50732421875, 1.5897216796875, 1.672119140625, 1.7545166015625, 1.8369140625, 1.9193115234375, 2.001708984375, 2.0841064453125, 2.16650390625, 2.2489013671875, 2.331298828125, 2.4136962890625, 2.49609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 4.0, 9.0, 4.0, 10.0, 10.0, 19.0, 25.0, 42.0, 52.0, 64.0, 94.0, 93.0, 107.0, 109.0, 90.0, 83.0, 51.0, 35.0, 19.0, 23.0, 14.0, 16.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017917156219482422, -0.0001738760620355606, -0.000168580561876297, -0.00016328506171703339, -0.00015798956155776978, -0.00015269406139850616, -0.00014739856123924255, -0.00014210306107997894, -0.00013680756092071533, -0.00013151206076145172, -0.0001262165606021881, -0.0001209210604429245, -0.00011562556028366089, -0.00011033006012439728, -0.00010503455996513367, -9.973905980587006e-05, -9.444355964660645e-05, -8.914805948734283e-05, -8.385255932807922e-05, -7.855705916881561e-05, -7.3261559009552e-05, -6.796605885028839e-05, -6.267055869102478e-05, -5.737505853176117e-05, -5.207955837249756e-05, -4.678405821323395e-05, -4.148855805397034e-05, -3.6193057894706726e-05, -3.0897557735443115e-05, -2.5602057576179504e-05, -2.0306557416915894e-05, -1.5011057257652283e-05, -9.715557098388672e-06, -4.420056939125061e-06, 8.754432201385498e-07, 6.170943379402161e-06, 1.1466443538665771e-05, 1.6761943697929382e-05, 2.2057443857192993e-05, 2.7352944016456604e-05, 3.2648444175720215e-05, 3.7943944334983826e-05, 4.3239444494247437e-05, 4.853494465351105e-05, 5.383044481277466e-05, 5.912594497203827e-05, 6.442144513130188e-05, 6.971694529056549e-05, 7.50124454498291e-05, 8.030794560909271e-05, 8.560344576835632e-05, 9.089894592761993e-05, 9.619444608688354e-05, 0.00010148994624614716, 0.00010678544640541077, 0.00011208094656467438, 0.00011737644672393799, 0.0001226719468832016, 0.0001279674470424652, 0.00013326294720172882, 0.00013855844736099243, 0.00014385394752025604, 0.00014914944767951965, 0.00015444494783878326, 0.00015974044799804688]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 13.0, 15.0, 28.0, 53.0, 112.0, 370.0, 1513.0, 16266.0, 620850.0, 397202.0, 10267.0, 1271.0, 346.0, 98.0, 51.0, 31.0, 13.0, 5.0, 11.0, 3.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.63671875, -2.558990478515625, -2.48126220703125, -2.403533935546875, -2.3258056640625, -2.248077392578125, -2.17034912109375, -2.092620849609375, -2.014892578125, -1.937164306640625, -1.85943603515625, -1.781707763671875, -1.7039794921875, -1.626251220703125, -1.54852294921875, -1.470794677734375, -1.39306640625, -1.315338134765625, -1.23760986328125, -1.159881591796875, -1.0821533203125, -1.004425048828125, -0.92669677734375, -0.848968505859375, -0.771240234375, -0.693511962890625, -0.61578369140625, -0.538055419921875, -0.4603271484375, -0.382598876953125, -0.30487060546875, -0.227142333984375, -0.1494140625, -0.071685791015625, 0.00604248046875, 0.083770751953125, 0.1614990234375, 0.239227294921875, 0.31695556640625, 0.394683837890625, 0.472412109375, 0.550140380859375, 0.62786865234375, 0.705596923828125, 0.7833251953125, 0.861053466796875, 0.93878173828125, 1.016510009765625, 1.09423828125, 1.171966552734375, 1.24969482421875, 1.327423095703125, 1.4051513671875, 1.482879638671875, 1.56060791015625, 1.638336181640625, 1.716064453125, 1.793792724609375, 1.87152099609375, 1.949249267578125, 2.0269775390625, 2.104705810546875, 2.18243408203125, 2.260162353515625, 2.337890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 8.0, 17.0, 23.0, 21.0, 40.0, 62.0, 64.0, 87.0, 106.0, 107.0, 118.0, 84.0, 72.0, 50.0, 44.0, 27.0, 20.0, 10.0, 6.0, 5.0, 11.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.59912109375, -0.5812911987304688, -0.5634613037109375, -0.5456314086914062, -0.527801513671875, -0.5099716186523438, -0.4921417236328125, -0.47431182861328125, -0.45648193359375, -0.43865203857421875, -0.4208221435546875, -0.40299224853515625, -0.385162353515625, -0.36733245849609375, -0.3495025634765625, -0.33167266845703125, -0.3138427734375, -0.29601287841796875, -0.2781829833984375, -0.26035308837890625, -0.242523193359375, -0.22469329833984375, -0.2068634033203125, -0.18903350830078125, -0.17120361328125, -0.15337371826171875, -0.1355438232421875, -0.11771392822265625, -0.099884033203125, -0.08205413818359375, -0.0642242431640625, -0.04639434814453125, -0.028564453125, -0.01073455810546875, 0.0070953369140625, 0.02492523193359375, 0.042755126953125, 0.06058502197265625, 0.0784149169921875, 0.09624481201171875, 0.11407470703125, 0.13190460205078125, 0.1497344970703125, 0.16756439208984375, 0.185394287109375, 0.20322418212890625, 0.2210540771484375, 0.23888397216796875, 0.2567138671875, 0.27454376220703125, 0.2923736572265625, 0.31020355224609375, 0.328033447265625, 0.34586334228515625, 0.3636932373046875, 0.38152313232421875, 0.39935302734375, 0.41718292236328125, 0.4350128173828125, 0.45284271240234375, 0.470672607421875, 0.48850250244140625, 0.5063323974609375, 0.5241622924804688, 0.5419921875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 25.0, 59.0, 144.0, 200.0, 206.0, 162.0, 110.0, 50.0, 22.0, 13.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-21.55654525756836, -21.14507293701172, -20.733600616455078, -20.322128295898438, -19.910655975341797, -19.499183654785156, -19.087711334228516, -18.676237106323242, -18.2647647857666, -17.85329246520996, -17.44182014465332, -17.03034782409668, -16.61887550354004, -16.207401275634766, -15.795929908752441, -15.3844575881958, -14.97298526763916, -14.56151294708252, -14.150040626525879, -13.738567352294922, -13.327095031738281, -12.91562271118164, -12.504150390625, -12.09267807006836, -11.681205749511719, -11.269733428955078, -10.858261108398438, -10.446788787841797, -10.03531551361084, -9.6238431930542, -9.212370872497559, -8.800898551940918, -8.389424324035645, -7.977952003479004, -7.566479206085205, -7.1550068855285645, -6.743534088134766, -6.332061767578125, -5.920589447021484, -5.509117126464844, -5.097644329071045, -4.686172008514404, -4.2746992111206055, -3.863226890563965, -3.451754331588745, -3.0402817726135254, -2.6288094520568848, -2.217336893081665, -1.8058643341064453, -1.3943917751312256, -0.9829193353652954, -0.5714468955993652, -0.1599743366241455, 0.2514982223510742, 0.6629705429077148, 1.0744431018829346, 1.4859156608581543, 1.897388219833374, 2.3088607788085938, 2.7203330993652344, 3.131805658340454, 3.543278217315674, 3.9547505378723145, 4.366223335266113, 4.777695655822754]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 10.0, 12.0, 13.0, 19.0, 29.0, 18.0, 19.0, 22.0, 40.0, 26.0, 40.0, 49.0, 40.0, 49.0, 47.0, 47.0, 54.0, 57.0, 51.0, 49.0, 37.0, 46.0, 30.0, 40.0, 31.0, 29.0, 13.0, 19.0, 15.0, 15.0, 4.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.909377098083496, -5.702003479003906, -5.494629859924316, -5.287256240844727, -5.079882621765137, -4.872509002685547, -4.665135383605957, -4.457761764526367, -4.250388145446777, -4.0430145263671875, -3.8356409072875977, -3.628267288208008, -3.420893669128418, -3.213520050048828, -3.0061464309692383, -2.7987728118896484, -2.5913991928100586, -2.3840255737304688, -2.176651954650879, -1.969278335571289, -1.7619047164916992, -1.5545310974121094, -1.3471574783325195, -1.1397838592529297, -0.9324102401733398, -0.72503662109375, -0.5176630020141602, -0.3102893829345703, -0.10291576385498047, 0.10445785522460938, 0.3118314743041992, 0.5192050933837891, 0.7265787124633789, 0.9339523315429688, 1.1413259506225586, 1.3486995697021484, 1.5560731887817383, 1.7634468078613281, 1.970820426940918, 2.178194046020508, 2.3855676651000977, 2.5929412841796875, 2.8003149032592773, 3.007688522338867, 3.215062141418457, 3.422435760498047, 3.6298093795776367, 3.8371829986572266, 4.044556617736816, 4.251930236816406, 4.459303855895996, 4.666677474975586, 4.874051094055176, 5.081424713134766, 5.2887983322143555, 5.496171951293945, 5.703545570373535, 5.910919189453125, 6.118292808532715, 6.325666427612305, 6.5330400466918945, 6.740413665771484, 6.947787284851074, 7.155160903930664, 7.362534523010254]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 16.0, 19.0, 35.0, 35.0, 42.0, 93.0, 138.0, 203.0, 354.0, 741.0, 2088.0, 12797.0, 205403.0, 2714576.0, 1195646.0, 55574.0, 4755.0, 963.0, 316.0, 180.0, 89.0, 64.0, 41.0, 32.0, 23.0, 14.0, 17.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.8740234375, -5.669921875, -5.4658203125, -5.26171875, -5.0576171875, -4.853515625, -4.6494140625, -4.4453125, -4.2412109375, -4.037109375, -3.8330078125, -3.62890625, -3.4248046875, -3.220703125, -3.0166015625, -2.8125, -2.6083984375, -2.404296875, -2.2001953125, -1.99609375, -1.7919921875, -1.587890625, -1.3837890625, -1.1796875, -0.9755859375, -0.771484375, -0.5673828125, -0.36328125, -0.1591796875, 0.044921875, 0.2490234375, 0.453125, 0.6572265625, 0.861328125, 1.0654296875, 1.26953125, 1.4736328125, 1.677734375, 1.8818359375, 2.0859375, 2.2900390625, 2.494140625, 2.6982421875, 2.90234375, 3.1064453125, 3.310546875, 3.5146484375, 3.71875, 3.9228515625, 4.126953125, 4.3310546875, 4.53515625, 4.7392578125, 4.943359375, 5.1474609375, 5.3515625, 5.5556640625, 5.759765625, 5.9638671875, 6.16796875, 6.3720703125, 6.576171875, 6.7802734375, 6.984375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 6.0, 11.0, 8.0, 6.0, 6.0, 11.0, 21.0, 23.0, 28.0, 29.0, 34.0, 44.0, 29.0, 56.0, 60.0, 47.0, 49.0, 55.0, 55.0, 60.0, 56.0, 41.0, 45.0, 52.0, 28.0, 36.0, 21.0, 20.0, 17.0, 9.0, 12.0, 5.0, 8.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.219879150390625, -2.12530517578125, -2.030731201171875, -1.9361572265625, -1.841583251953125, -1.74700927734375, -1.652435302734375, -1.557861328125, -1.463287353515625, -1.36871337890625, -1.274139404296875, -1.1795654296875, -1.084991455078125, -0.99041748046875, -0.895843505859375, -0.80126953125, -0.706695556640625, -0.61212158203125, -0.517547607421875, -0.4229736328125, -0.328399658203125, -0.23382568359375, -0.139251708984375, -0.044677734375, 0.049896240234375, 0.14447021484375, 0.239044189453125, 0.3336181640625, 0.428192138671875, 0.52276611328125, 0.617340087890625, 0.7119140625, 0.806488037109375, 0.90106201171875, 0.995635986328125, 1.0902099609375, 1.184783935546875, 1.27935791015625, 1.373931884765625, 1.468505859375, 1.563079833984375, 1.65765380859375, 1.752227783203125, 1.8468017578125, 1.941375732421875, 2.03594970703125, 2.130523681640625, 2.22509765625, 2.319671630859375, 2.41424560546875, 2.508819580078125, 2.6033935546875, 2.697967529296875, 2.79254150390625, 2.887115478515625, 2.981689453125, 3.076263427734375, 3.17083740234375, 3.265411376953125, 3.3599853515625, 3.454559326171875, 3.54913330078125, 3.643707275390625, 3.73828125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 19.0, 25.0, 90.0, 451.0, 7932.0, 4143228.0, 41581.0, 722.0, 172.0, 44.0, 20.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.625, -26.04150390625, -25.4580078125, -24.87451171875, -24.291015625, -23.70751953125, -23.1240234375, -22.54052734375, -21.95703125, -21.37353515625, -20.7900390625, -20.20654296875, -19.623046875, -19.03955078125, -18.4560546875, -17.87255859375, -17.2890625, -16.70556640625, -16.1220703125, -15.53857421875, -14.955078125, -14.37158203125, -13.7880859375, -13.20458984375, -12.62109375, -12.03759765625, -11.4541015625, -10.87060546875, -10.287109375, -9.70361328125, -9.1201171875, -8.53662109375, -7.953125, -7.36962890625, -6.7861328125, -6.20263671875, -5.619140625, -5.03564453125, -4.4521484375, -3.86865234375, -3.28515625, -2.70166015625, -2.1181640625, -1.53466796875, -0.951171875, -0.36767578125, 0.2158203125, 0.79931640625, 1.3828125, 1.96630859375, 2.5498046875, 3.13330078125, 3.716796875, 4.30029296875, 4.8837890625, 5.46728515625, 6.05078125, 6.63427734375, 7.2177734375, 7.80126953125, 8.384765625, 8.96826171875, 9.5517578125, 10.13525390625, 10.71875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 4.0, 10.0, 12.0, 19.0, 18.0, 30.0, 56.0, 103.0, 152.0, 267.0, 384.0, 498.0, 641.0, 624.0, 467.0, 297.0, 182.0, 121.0, 83.0, 45.0, 19.0, 13.0, 8.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3638763427734375, -1.314666748046875, -1.2654571533203125, -1.21624755859375, -1.1670379638671875, -1.117828369140625, -1.0686187744140625, -1.0194091796875, -0.9701995849609375, -0.920989990234375, -0.8717803955078125, -0.82257080078125, -0.7733612060546875, -0.724151611328125, -0.6749420166015625, -0.625732421875, -0.5765228271484375, -0.527313232421875, -0.4781036376953125, -0.42889404296875, -0.3796844482421875, -0.330474853515625, -0.2812652587890625, -0.2320556640625, -0.1828460693359375, -0.133636474609375, -0.0844268798828125, -0.03521728515625, 0.0139923095703125, 0.063201904296875, 0.1124114990234375, 0.16162109375, 0.2108306884765625, 0.260040283203125, 0.3092498779296875, 0.35845947265625, 0.4076690673828125, 0.456878662109375, 0.5060882568359375, 0.5552978515625, 0.6045074462890625, 0.653717041015625, 0.7029266357421875, 0.75213623046875, 0.8013458251953125, 0.850555419921875, 0.8997650146484375, 0.948974609375, 0.9981842041015625, 1.047393798828125, 1.0966033935546875, 1.14581298828125, 1.1950225830078125, 1.244232177734375, 1.2934417724609375, 1.3426513671875, 1.3918609619140625, 1.441070556640625, 1.4902801513671875, 1.53948974609375, 1.5886993408203125, 1.637908935546875, 1.6871185302734375, 1.736328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 15.0, 30.0, 37.0, 44.0, 71.0, 112.0, 132.0, 129.0, 128.0, 108.0, 61.0, 48.0, 34.0, 20.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.638984680175781, -6.447938442230225, -6.256892204284668, -6.065845966339111, -5.874799728393555, -5.683753967285156, -5.492707252502441, -5.301661491394043, -5.110615253448486, -4.91956901550293, -4.728522777557373, -4.537476539611816, -4.34643030166626, -4.155384063720703, -3.9643380641937256, -3.773292064666748, -3.5822455883026123, -3.3911993503570557, -3.200153112411499, -3.0091071128845215, -2.818060874938965, -2.627014636993408, -2.4359683990478516, -2.244922161102295, -2.0538759231567383, -1.8628296852111816, -1.6717835664749146, -1.480737328529358, -1.2896912097930908, -1.0986449718475342, -0.9075987339019775, -0.7165526151657104, -0.5255064964294434, -0.3344603180885315, -0.14341410994529724, 0.04763209819793701, 0.23867827653884888, 0.42972445487976074, 0.6207706928253174, 0.8118168115615845, 1.0028630495071411, 1.1939092874526978, 1.3849554061889648, 1.5760016441345215, 1.7670478820800781, 1.9580940008163452, 2.1491403579711914, 2.340186357498169, 2.5312325954437256, 2.7222788333892822, 2.913325071334839, 3.1043710708618164, 3.295417308807373, 3.4864635467529297, 3.6775097846984863, 3.868556022644043, 4.0596022605896, 4.250648498535156, 4.441694736480713, 4.6327409744262695, 4.823787212371826, 5.014833450317383, 5.205879211425781, 5.396925449371338, 5.5879716873168945]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 5.0, 8.0, 5.0, 12.0, 10.0, 14.0, 19.0, 17.0, 16.0, 17.0, 18.0, 30.0, 31.0, 29.0, 36.0, 29.0, 41.0, 46.0, 42.0, 44.0, 48.0, 43.0, 55.0, 41.0, 36.0, 29.0, 28.0, 26.0, 33.0, 28.0, 25.0, 14.0, 16.0, 19.0, 21.0, 11.0, 12.0, 8.0, 2.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.3792097568511963, -2.297116279602051, -2.2150228023529053, -2.1329293251037598, -2.050835609436035, -1.9687422513961792, -1.8866486549377441, -1.8045551776885986, -1.7224617004394531, -1.6403682231903076, -1.558274745941162, -1.476181149482727, -1.3940876722335815, -1.311994194984436, -1.229900598526001, -1.1478071212768555, -1.06571364402771, -0.9836201667785645, -0.9015266299247742, -0.8194330930709839, -0.7373396158218384, -0.6552461385726929, -0.5731526017189026, -0.4910590648651123, -0.4089655876159668, -0.3268720805644989, -0.244778573513031, -0.1626850664615631, -0.08059155941009521, 0.0015019476413726807, 0.08359545469284058, 0.16568899154663086, 0.24778223037719727, 0.32987573742866516, 0.41196924448013306, 0.49406275153160095, 0.5761562585830688, 0.6582497358322144, 0.7403432726860046, 0.8224368095397949, 0.9045302867889404, 0.9866237640380859, 1.0687172412872314, 1.1508108377456665, 1.232904314994812, 1.3149977922439575, 1.3970913887023926, 1.479184865951538, 1.5612783432006836, 1.643371820449829, 1.7254652976989746, 1.8075588941574097, 1.8896523714065552, 1.9717458486557007, 2.0538394451141357, 2.1359329223632812, 2.2180263996124268, 2.3001198768615723, 2.3822133541107178, 2.4643068313598633, 2.546400547027588, 2.6284940242767334, 2.710587501525879, 2.7926809787750244, 2.87477445602417]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 16.0, 17.0, 21.0, 27.0, 50.0, 101.0, 195.0, 405.0, 1106.0, 4169.0, 23243.0, 195751.0, 664484.0, 136735.0, 17254.0, 3337.0, 934.0, 337.0, 149.0, 93.0, 53.0, 40.0, 18.0, 12.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.8653717041015625, -0.831329345703125, -0.7972869873046875, -0.76324462890625, -0.7292022705078125, -0.695159912109375, -0.6611175537109375, -0.6270751953125, -0.5930328369140625, -0.558990478515625, -0.5249481201171875, -0.49090576171875, -0.4568634033203125, -0.422821044921875, -0.3887786865234375, -0.354736328125, -0.3206939697265625, -0.286651611328125, -0.2526092529296875, -0.21856689453125, -0.1845245361328125, -0.150482177734375, -0.1164398193359375, -0.0823974609375, -0.0483551025390625, -0.014312744140625, 0.0197296142578125, 0.05377197265625, 0.0878143310546875, 0.121856689453125, 0.1558990478515625, 0.18994140625, 0.2239837646484375, 0.258026123046875, 0.2920684814453125, 0.32611083984375, 0.3601531982421875, 0.394195556640625, 0.4282379150390625, 0.4622802734375, 0.4963226318359375, 0.530364990234375, 0.5644073486328125, 0.59844970703125, 0.6324920654296875, 0.666534423828125, 0.7005767822265625, 0.734619140625, 0.7686614990234375, 0.802703857421875, 0.8367462158203125, 0.87078857421875, 0.9048309326171875, 0.938873291015625, 0.9729156494140625, 1.0069580078125, 1.0410003662109375, 1.075042724609375, 1.1090850830078125, 1.14312744140625, 1.1771697998046875, 1.211212158203125, 1.2452545166015625, 1.279296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 6.0, 11.0, 10.0, 20.0, 26.0, 41.0, 28.0, 51.0, 76.0, 94.0, 81.0, 99.0, 86.0, 81.0, 53.0, 56.0, 59.0, 39.0, 19.0, 21.0, 20.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.382080078125, -2.27197265625, -2.161865234375, -2.0517578125, -1.941650390625, -1.83154296875, -1.721435546875, -1.611328125, -1.501220703125, -1.39111328125, -1.281005859375, -1.1708984375, -1.060791015625, -0.95068359375, -0.840576171875, -0.73046875, -0.620361328125, -0.51025390625, -0.400146484375, -0.2900390625, -0.179931640625, -0.06982421875, 0.040283203125, 0.150390625, 0.260498046875, 0.37060546875, 0.480712890625, 0.5908203125, 0.700927734375, 0.81103515625, 0.921142578125, 1.03125, 1.141357421875, 1.25146484375, 1.361572265625, 1.4716796875, 1.581787109375, 1.69189453125, 1.802001953125, 1.912109375, 2.022216796875, 2.13232421875, 2.242431640625, 2.3525390625, 2.462646484375, 2.57275390625, 2.682861328125, 2.79296875, 2.903076171875, 3.01318359375, 3.123291015625, 3.2333984375, 3.343505859375, 3.45361328125, 3.563720703125, 3.673828125, 3.783935546875, 3.89404296875, 4.004150390625, 4.1142578125, 4.224365234375, 4.33447265625, 4.444580078125, 4.5546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 9.0, 17.0, 17.0, 23.0, 47.0, 59.0, 91.0, 159.0, 227.0, 336.0, 544.0, 875.0, 1424.0, 2359.0, 3934.0, 6678.0, 11350.0, 19652.0, 33386.0, 55729.0, 89925.0, 135190.0, 171917.0, 169557.0, 129964.0, 85821.0, 53160.0, 31153.0, 18252.0, 10731.0, 6353.0, 3797.0, 2148.0, 1312.0, 801.0, 558.0, 328.0, 223.0, 146.0, 104.0, 60.0, 32.0, 33.0, 16.0, 14.0, 8.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.1851482391357422, -0.17852401733398438, -0.17189979553222656, -0.16527557373046875, -0.15865135192871094, -0.15202713012695312, -0.1454029083251953, -0.1387786865234375, -0.1321544647216797, -0.12553024291992188, -0.11890602111816406, -0.11228179931640625, -0.10565757751464844, -0.09903335571289062, -0.09240913391113281, -0.085784912109375, -0.07916069030761719, -0.07253646850585938, -0.06591224670410156, -0.05928802490234375, -0.05266380310058594, -0.046039581298828125, -0.03941535949707031, -0.0327911376953125, -0.026166915893554688, -0.019542694091796875, -0.012918472290039062, -0.00629425048828125, 0.0003299713134765625, 0.006954193115234375, 0.013578414916992188, 0.02020263671875, 0.026826858520507812, 0.033451080322265625, 0.04007530212402344, 0.04669952392578125, 0.05332374572753906, 0.059947967529296875, 0.06657218933105469, 0.0731964111328125, 0.07982063293457031, 0.08644485473632812, 0.09306907653808594, 0.09969329833984375, 0.10631752014160156, 0.11294174194335938, 0.11956596374511719, 0.126190185546875, 0.1328144073486328, 0.13943862915039062, 0.14606285095214844, 0.15268707275390625, 0.15931129455566406, 0.16593551635742188, 0.1725597381591797, 0.1791839599609375, 0.1858081817626953, 0.19243240356445312, 0.19905662536621094, 0.20568084716796875, 0.21230506896972656, 0.21892929077148438, 0.2255535125732422, 0.232177734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 13.0, 16.0, 17.0, 18.0, 25.0, 20.0, 39.0, 40.0, 37.0, 48.0, 24.0, 63.0, 64.0, 50.0, 44.0, 51.0, 48.0, 43.0, 37.0, 36.0, 31.0, 40.0, 29.0, 37.0, 26.0, 18.0, 13.0, 19.0, 11.0, 8.0, 8.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.432220458984375, -3.30389404296875, -3.175567626953125, -3.0472412109375, -2.918914794921875, -2.79058837890625, -2.662261962890625, -2.533935546875, -2.405609130859375, -2.27728271484375, -2.148956298828125, -2.0206298828125, -1.892303466796875, -1.76397705078125, -1.635650634765625, -1.50732421875, -1.378997802734375, -1.25067138671875, -1.122344970703125, -0.9940185546875, -0.865692138671875, -0.73736572265625, -0.609039306640625, -0.480712890625, -0.352386474609375, -0.22406005859375, -0.095733642578125, 0.0325927734375, 0.160919189453125, 0.28924560546875, 0.417572021484375, 0.5458984375, 0.674224853515625, 0.80255126953125, 0.930877685546875, 1.0592041015625, 1.187530517578125, 1.31585693359375, 1.444183349609375, 1.572509765625, 1.700836181640625, 1.82916259765625, 1.957489013671875, 2.0858154296875, 2.214141845703125, 2.34246826171875, 2.470794677734375, 2.59912109375, 2.727447509765625, 2.85577392578125, 2.984100341796875, 3.1124267578125, 3.240753173828125, 3.36907958984375, 3.497406005859375, 3.625732421875, 3.754058837890625, 3.88238525390625, 4.010711669921875, 4.1390380859375, 4.267364501953125, 4.39569091796875, 4.524017333984375, 4.65234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 17.0, 10.0, 21.0, 33.0, 44.0, 68.0, 92.0, 144.0, 202.0, 348.0, 514.0, 823.0, 1532.0, 2727.0, 5752.0, 13316.0, 34658.0, 96051.0, 236832.0, 335797.0, 195295.0, 75481.0, 27537.0, 10753.0, 4782.0, 2311.0, 1251.0, 780.0, 456.0, 266.0, 195.0, 136.0, 106.0, 73.0, 32.0, 23.0, 18.0, 13.0, 16.0, 10.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04296875, -0.0416417121887207, -0.040314674377441406, -0.03898763656616211, -0.03766059875488281, -0.036333560943603516, -0.03500652313232422, -0.03367948532104492, -0.032352447509765625, -0.031025409698486328, -0.02969837188720703, -0.028371334075927734, -0.027044296264648438, -0.02571725845336914, -0.024390220642089844, -0.023063182830810547, -0.02173614501953125, -0.020409107208251953, -0.019082069396972656, -0.01775503158569336, -0.016427993774414062, -0.015100955963134766, -0.013773918151855469, -0.012446880340576172, -0.011119842529296875, -0.009792804718017578, -0.008465766906738281, -0.007138729095458984, -0.0058116912841796875, -0.004484653472900391, -0.0031576156616210938, -0.0018305778503417969, -0.0005035400390625, 0.0008234977722167969, 0.0021505355834960938, 0.0034775733947753906, 0.0048046112060546875, 0.006131649017333984, 0.007458686828613281, 0.008785724639892578, 0.010112762451171875, 0.011439800262451172, 0.012766838073730469, 0.014093875885009766, 0.015420913696289062, 0.01674795150756836, 0.018074989318847656, 0.019402027130126953, 0.02072906494140625, 0.022056102752685547, 0.023383140563964844, 0.02471017837524414, 0.026037216186523438, 0.027364253997802734, 0.02869129180908203, 0.030018329620361328, 0.031345367431640625, 0.03267240524291992, 0.03399944305419922, 0.035326480865478516, 0.03665351867675781, 0.03798055648803711, 0.039307594299316406, 0.0406346321105957, 0.041961669921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 12.0, 6.0, 12.0, 12.0, 26.0, 22.0, 24.0, 35.0, 45.0, 44.0, 53.0, 54.0, 63.0, 74.0, 75.0, 71.0, 68.0, 45.0, 39.0, 48.0, 24.0, 32.0, 22.0, 18.0, 8.0, 13.0, 11.0, 10.0, 3.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361701965332031e-05, -3.2568350434303284e-05, -3.1519681215286255e-05, -3.0471011996269226e-05, -2.9422342777252197e-05, -2.837367355823517e-05, -2.732500433921814e-05, -2.627633512020111e-05, -2.5227665901184082e-05, -2.4178996682167053e-05, -2.3130327463150024e-05, -2.2081658244132996e-05, -2.1032989025115967e-05, -1.9984319806098938e-05, -1.893565058708191e-05, -1.788698136806488e-05, -1.683831214904785e-05, -1.5789642930030823e-05, -1.4740973711013794e-05, -1.3692304491996765e-05, -1.2643635272979736e-05, -1.1594966053962708e-05, -1.0546296834945679e-05, -9.49762761592865e-06, -8.448958396911621e-06, -7.400289177894592e-06, -6.3516199588775635e-06, -5.302950739860535e-06, -4.254281520843506e-06, -3.205612301826477e-06, -2.1569430828094482e-06, -1.1082738637924194e-06, -5.960464477539063e-08, 9.890645742416382e-07, 2.037733793258667e-06, 3.086403012275696e-06, 4.135072231292725e-06, 5.183741450309753e-06, 6.232410669326782e-06, 7.281079888343811e-06, 8.32974910736084e-06, 9.378418326377869e-06, 1.0427087545394897e-05, 1.1475756764411926e-05, 1.2524425983428955e-05, 1.3573095202445984e-05, 1.4621764421463013e-05, 1.567043364048004e-05, 1.671910285949707e-05, 1.77677720785141e-05, 1.8816441297531128e-05, 1.9865110516548157e-05, 2.0913779735565186e-05, 2.1962448954582214e-05, 2.3011118173599243e-05, 2.4059787392616272e-05, 2.51084566116333e-05, 2.615712583065033e-05, 2.720579504966736e-05, 2.8254464268684387e-05, 2.9303133487701416e-05, 3.0351802706718445e-05, 3.1400471925735474e-05, 3.24491411447525e-05, 3.349781036376953e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 14.0, 14.0, 19.0, 29.0, 46.0, 82.0, 156.0, 291.0, 565.0, 1480.0, 4565.0, 16836.0, 79714.0, 367949.0, 438856.0, 107131.0, 21833.0, 5687.0, 1787.0, 732.0, 328.0, 169.0, 90.0, 58.0, 33.0, 23.0, 8.0, 10.0, 10.0, 6.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06640625, -0.06427001953125, -0.0621337890625, -0.05999755859375, -0.057861328125, -0.05572509765625, -0.0535888671875, -0.05145263671875, -0.04931640625, -0.04718017578125, -0.0450439453125, -0.04290771484375, -0.040771484375, -0.03863525390625, -0.0364990234375, -0.03436279296875, -0.0322265625, -0.03009033203125, -0.0279541015625, -0.02581787109375, -0.023681640625, -0.02154541015625, -0.0194091796875, -0.01727294921875, -0.01513671875, -0.01300048828125, -0.0108642578125, -0.00872802734375, -0.006591796875, -0.00445556640625, -0.0023193359375, -0.00018310546875, 0.001953125, 0.00408935546875, 0.0062255859375, 0.00836181640625, 0.010498046875, 0.01263427734375, 0.0147705078125, 0.01690673828125, 0.01904296875, 0.02117919921875, 0.0233154296875, 0.02545166015625, 0.027587890625, 0.02972412109375, 0.0318603515625, 0.03399658203125, 0.0361328125, 0.03826904296875, 0.0404052734375, 0.04254150390625, 0.044677734375, 0.04681396484375, 0.0489501953125, 0.05108642578125, 0.05322265625, 0.05535888671875, 0.0574951171875, 0.05963134765625, 0.061767578125, 0.06390380859375, 0.0660400390625, 0.06817626953125, 0.0703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 3.0, 1.0, 8.0, 8.0, 11.0, 24.0, 15.0, 22.0, 32.0, 45.0, 59.0, 70.0, 88.0, 82.0, 77.0, 90.0, 70.0, 70.0, 47.0, 35.0, 28.0, 27.0, 18.0, 14.0, 9.0, 5.0, 6.0, 4.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01763916015625, -0.017047643661499023, -0.016456127166748047, -0.01586461067199707, -0.015273094177246094, -0.014681577682495117, -0.01409006118774414, -0.013498544692993164, -0.012907028198242188, -0.012315511703491211, -0.011723995208740234, -0.011132478713989258, -0.010540962219238281, -0.009949445724487305, -0.009357929229736328, -0.008766412734985352, -0.008174896240234375, -0.0075833797454833984, -0.006991863250732422, -0.006400346755981445, -0.005808830261230469, -0.005217313766479492, -0.004625797271728516, -0.004034280776977539, -0.0034427642822265625, -0.002851247787475586, -0.0022597312927246094, -0.0016682147979736328, -0.0010766983032226562, -0.0004851818084716797, 0.00010633468627929688, 0.0006978511810302734, 0.00128936767578125, 0.0018808841705322266, 0.002472400665283203, 0.0030639171600341797, 0.0036554336547851562, 0.004246950149536133, 0.004838466644287109, 0.005429983139038086, 0.0060214996337890625, 0.006613016128540039, 0.007204532623291016, 0.007796049118041992, 0.008387565612792969, 0.008979082107543945, 0.009570598602294922, 0.010162115097045898, 0.010753631591796875, 0.011345148086547852, 0.011936664581298828, 0.012528181076049805, 0.013119697570800781, 0.013711214065551758, 0.014302730560302734, 0.014894247055053711, 0.015485763549804688, 0.016077280044555664, 0.01666879653930664, 0.017260313034057617, 0.017851829528808594, 0.01844334602355957, 0.019034862518310547, 0.019626379013061523, 0.0202178955078125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 16.0, 113.0, 363.0, 373.0, 115.0, 20.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.987186431884766, -8.596941947937012, -8.206696510314941, -7.8164520263671875, -7.426207542419434, -7.0359625816345215, -6.645717620849609, -6.2554731369018555, -5.865228176116943, -5.474983215332031, -5.084738731384277, -4.694493770599365, -4.304248809814453, -3.914004325866699, -3.523759365081787, -3.133514642715454, -2.743269920349121, -2.353025197982788, -1.9627803564071655, -1.572535514831543, -1.18229079246521, -0.792046070098877, -0.40180110931396484, -0.011556386947631836, 0.37868833541870117, 0.768933117389679, 1.1591778993606567, 1.5494227409362793, 1.9396674633026123, 2.3299121856689453, 2.7201571464538574, 3.1104018688201904, 3.5006465911865234, 3.8908913135528564, 4.2811360359191895, 4.671380996704102, 5.0616254806518555, 5.451870441436768, 5.84211540222168, 6.232359886169434, 6.622604846954346, 7.012849807739258, 7.403094291687012, 7.793339252471924, 8.183584213256836, 8.57382869720459, 8.964073181152344, 9.354318618774414, 9.744563102722168, 10.134807586669922, 10.525053024291992, 10.915297508239746, 11.3055419921875, 11.69578742980957, 12.086031913757324, 12.476276397705078, 12.866521835327148, 13.256766319274902, 13.647011756896973, 14.037256240844727, 14.42750072479248, 14.817745208740234, 15.207990646362305, 15.598235130310059, 15.988479614257812]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 1.0, 7.0, 4.0, 4.0, 12.0, 15.0, 17.0, 24.0, 31.0, 23.0, 42.0, 49.0, 45.0, 56.0, 77.0, 67.0, 68.0, 75.0, 65.0, 47.0, 47.0, 45.0, 38.0, 37.0, 22.0, 19.0, 18.0, 16.0, 3.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.84909725189209, -2.7684621810913086, -2.6878268718719482, -2.607191801071167, -2.5265567302703857, -2.4459214210510254, -2.365286350250244, -2.284651279449463, -2.2040159702301025, -2.1233808994293213, -2.042745590209961, -1.9621105194091797, -1.8814753293991089, -1.800840139389038, -1.7202050685882568, -1.639569878578186, -1.5589348077774048, -1.478299617767334, -1.3976645469665527, -1.317029356956482, -1.2363941669464111, -1.1557590961456299, -1.075123906135559, -0.9944887161254883, -0.9138535857200623, -0.8332184553146362, -0.7525832653045654, -0.6719481348991394, -0.5913130044937134, -0.5106778144836426, -0.43004268407821655, -0.34940749406814575, -0.2687723636627197, -0.1881372034549713, -0.1075020581483841, -0.026866912841796875, 0.05376824736595154, 0.13440340757369995, 0.21503853797912598, 0.2956737279891968, 0.3763088583946228, 0.4569440186023712, 0.5375791788101196, 0.6182143092155457, 0.6988494396209717, 0.7794846296310425, 0.8601197600364685, 0.9407549500465393, 1.0213900804519653, 1.1020252704620361, 1.1826603412628174, 1.2632955312728882, 1.343930721282959, 1.4245657920837402, 1.505200982093811, 1.5858361721038818, 1.666471242904663, 1.7471064329147339, 1.8277415037155151, 1.908376693725586, 1.9890118837356567, 2.0696470737457275, 2.150282144546509, 2.230917453765869, 2.3115525245666504]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 6.0, 9.0, 5.0, 11.0, 14.0, 10.0, 20.0, 16.0, 32.0, 46.0, 69.0, 121.0, 476.0, 4473.0, 73933.0, 705773.0, 247476.0, 14392.0, 1107.0, 202.0, 82.0, 60.0, 49.0, 32.0, 22.0, 20.0, 14.0, 12.0, 11.0, 8.0, 4.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.11328125, -5.9205322265625, -5.727783203125, -5.5350341796875, -5.34228515625, -5.1495361328125, -4.956787109375, -4.7640380859375, -4.5712890625, -4.3785400390625, -4.185791015625, -3.9930419921875, -3.80029296875, -3.6075439453125, -3.414794921875, -3.2220458984375, -3.029296875, -2.8365478515625, -2.643798828125, -2.4510498046875, -2.25830078125, -2.0655517578125, -1.872802734375, -1.6800537109375, -1.4873046875, -1.2945556640625, -1.101806640625, -0.9090576171875, -0.71630859375, -0.5235595703125, -0.330810546875, -0.1380615234375, 0.0546875, 0.2474365234375, 0.440185546875, 0.6329345703125, 0.82568359375, 1.0184326171875, 1.211181640625, 1.4039306640625, 1.5966796875, 1.7894287109375, 1.982177734375, 2.1749267578125, 2.36767578125, 2.5604248046875, 2.753173828125, 2.9459228515625, 3.138671875, 3.3314208984375, 3.524169921875, 3.7169189453125, 3.90966796875, 4.1024169921875, 4.295166015625, 4.4879150390625, 4.6806640625, 4.8734130859375, 5.066162109375, 5.2589111328125, 5.45166015625, 5.6444091796875, 5.837158203125, 6.0299072265625, 6.22265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 16.0, 20.0, 57.0, 67.0, 107.0, 164.0, 163.0, 152.0, 92.0, 79.0, 41.0, 24.0, 8.0, 8.0, 5.0, 1.0, 0.0, 2.0], "bins": [-17.25, -16.920684814453125, -16.59136962890625, -16.262054443359375, -15.9327392578125, -15.603424072265625, -15.27410888671875, -14.944793701171875, -14.615478515625, -14.286163330078125, -13.95684814453125, -13.627532958984375, -13.2982177734375, -12.968902587890625, -12.63958740234375, -12.310272216796875, -11.98095703125, -11.651641845703125, -11.32232666015625, -10.993011474609375, -10.6636962890625, -10.334381103515625, -10.00506591796875, -9.675750732421875, -9.346435546875, -9.017120361328125, -8.68780517578125, -8.358489990234375, -8.0291748046875, -7.699859619140625, -7.37054443359375, -7.041229248046875, -6.7119140625, -6.382598876953125, -6.05328369140625, -5.723968505859375, -5.3946533203125, -5.065338134765625, -4.73602294921875, -4.406707763671875, -4.077392578125, -3.748077392578125, -3.41876220703125, -3.089447021484375, -2.7601318359375, -2.430816650390625, -2.10150146484375, -1.772186279296875, -1.44287109375, -1.113555908203125, -0.78424072265625, -0.454925537109375, -0.1256103515625, 0.203704833984375, 0.53302001953125, 0.862335205078125, 1.191650390625, 1.520965576171875, 1.85028076171875, 2.179595947265625, 2.5089111328125, 2.838226318359375, 3.16754150390625, 3.496856689453125, 3.826171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 12.0, 28.0, 29.0, 40.0, 47.0, 76.0, 103.0, 95.0, 128.0, 159.0, 248.0, 382.0, 1045.0, 10683.0, 260721.0, 721425.0, 49149.0, 2541.0, 528.0, 271.0, 209.0, 157.0, 122.0, 98.0, 68.0, 61.0, 38.0, 24.0, 21.0, 13.0, 6.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.80413818359375, -5.6121826171875, -5.42022705078125, -5.228271484375, -5.03631591796875, -4.8443603515625, -4.65240478515625, -4.46044921875, -4.26849365234375, -4.0765380859375, -3.88458251953125, -3.692626953125, -3.50067138671875, -3.3087158203125, -3.11676025390625, -2.9248046875, -2.73284912109375, -2.5408935546875, -2.34893798828125, -2.156982421875, -1.96502685546875, -1.7730712890625, -1.58111572265625, -1.38916015625, -1.19720458984375, -1.0052490234375, -0.81329345703125, -0.621337890625, -0.42938232421875, -0.2374267578125, -0.04547119140625, 0.146484375, 0.33843994140625, 0.5303955078125, 0.72235107421875, 0.914306640625, 1.10626220703125, 1.2982177734375, 1.49017333984375, 1.68212890625, 1.87408447265625, 2.0660400390625, 2.25799560546875, 2.449951171875, 2.64190673828125, 2.8338623046875, 3.02581787109375, 3.2177734375, 3.40972900390625, 3.6016845703125, 3.79364013671875, 3.985595703125, 4.17755126953125, 4.3695068359375, 4.56146240234375, 4.75341796875, 4.94537353515625, 5.1373291015625, 5.32928466796875, 5.521240234375, 5.71319580078125, 5.9051513671875, 6.09710693359375, 6.2890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 14.0, 12.0, 23.0, 29.0, 35.0, 27.0, 32.0, 41.0, 42.0, 34.0, 44.0, 43.0, 46.0, 37.0, 51.0, 61.0, 50.0, 57.0, 41.0, 35.0, 24.0, 37.0, 39.0, 23.0, 19.0, 16.0, 12.0, 16.0, 6.0, 4.0, 2.0, 5.0, 6.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.2265625, -4.112762451171875, -3.99896240234375, -3.885162353515625, -3.7713623046875, -3.657562255859375, -3.54376220703125, -3.429962158203125, -3.316162109375, -3.202362060546875, -3.08856201171875, -2.974761962890625, -2.8609619140625, -2.747161865234375, -2.63336181640625, -2.519561767578125, -2.40576171875, -2.291961669921875, -2.17816162109375, -2.064361572265625, -1.9505615234375, -1.836761474609375, -1.72296142578125, -1.609161376953125, -1.495361328125, -1.381561279296875, -1.26776123046875, -1.153961181640625, -1.0401611328125, -0.926361083984375, -0.81256103515625, -0.698760986328125, -0.5849609375, -0.471160888671875, -0.35736083984375, -0.243560791015625, -0.1297607421875, -0.015960693359375, 0.09783935546875, 0.211639404296875, 0.325439453125, 0.439239501953125, 0.55303955078125, 0.666839599609375, 0.7806396484375, 0.894439697265625, 1.00823974609375, 1.122039794921875, 1.23583984375, 1.349639892578125, 1.46343994140625, 1.577239990234375, 1.6910400390625, 1.804840087890625, 1.91864013671875, 2.032440185546875, 2.146240234375, 2.260040283203125, 2.37384033203125, 2.487640380859375, 2.6014404296875, 2.715240478515625, 2.82904052734375, 2.942840576171875, 3.056640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 5.0, 9.0, 17.0, 25.0, 29.0, 87.0, 145.0, 425.0, 1713.0, 11048.0, 384600.0, 631699.0, 15569.0, 2266.0, 514.0, 165.0, 72.0, 46.0, 22.0, 10.0, 13.0, 14.0, 10.0, 0.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.98046875, -2.884552001953125, -2.78863525390625, -2.692718505859375, -2.5968017578125, -2.500885009765625, -2.40496826171875, -2.309051513671875, -2.213134765625, -2.117218017578125, -2.02130126953125, -1.925384521484375, -1.8294677734375, -1.733551025390625, -1.63763427734375, -1.541717529296875, -1.44580078125, -1.349884033203125, -1.25396728515625, -1.158050537109375, -1.0621337890625, -0.966217041015625, -0.87030029296875, -0.774383544921875, -0.678466796875, -0.582550048828125, -0.48663330078125, -0.390716552734375, -0.2947998046875, -0.198883056640625, -0.10296630859375, -0.007049560546875, 0.0888671875, 0.184783935546875, 0.28070068359375, 0.376617431640625, 0.4725341796875, 0.568450927734375, 0.66436767578125, 0.760284423828125, 0.856201171875, 0.952117919921875, 1.04803466796875, 1.143951416015625, 1.2398681640625, 1.335784912109375, 1.43170166015625, 1.527618408203125, 1.62353515625, 1.719451904296875, 1.81536865234375, 1.911285400390625, 2.0072021484375, 2.103118896484375, 2.19903564453125, 2.294952392578125, 2.390869140625, 2.486785888671875, 2.58270263671875, 2.678619384765625, 2.7745361328125, 2.870452880859375, 2.96636962890625, 3.062286376953125, 3.158203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 3.0, 21.0, 18.0, 24.0, 28.0, 35.0, 68.0, 76.0, 91.0, 96.0, 98.0, 87.0, 83.0, 58.0, 60.0, 32.0, 24.0, 27.0, 14.0, 10.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021398067474365234, -0.0002077445387840271, -0.00020150840282440186, -0.0001952722668647766, -0.00018903613090515137, -0.00018279999494552612, -0.00017656385898590088, -0.00017032772302627563, -0.0001640915870666504, -0.00015785545110702515, -0.0001516193151473999, -0.00014538317918777466, -0.00013914704322814941, -0.00013291090726852417, -0.00012667477130889893, -0.00012043863534927368, -0.00011420249938964844, -0.0001079663634300232, -0.00010173022747039795, -9.54940915107727e-05, -8.925795555114746e-05, -8.302181959152222e-05, -7.678568363189697e-05, -7.054954767227173e-05, -6.431341171264648e-05, -5.807727575302124e-05, -5.1841139793395996e-05, -4.560500383377075e-05, -3.936886787414551e-05, -3.3132731914520264e-05, -2.689659595489502e-05, -2.0660459995269775e-05, -1.4424324035644531e-05, -8.188188076019287e-06, -1.952052116394043e-06, 4.284083843231201e-06, 1.0520219802856445e-05, 1.675635576248169e-05, 2.2992491722106934e-05, 2.9228627681732178e-05, 3.546476364135742e-05, 4.1700899600982666e-05, 4.793703556060791e-05, 5.4173171520233154e-05, 6.04093074798584e-05, 6.664544343948364e-05, 7.288157939910889e-05, 7.911771535873413e-05, 8.535385131835938e-05, 9.158998727798462e-05, 9.782612323760986e-05, 0.00010406225919723511, 0.00011029839515686035, 0.0001165345311164856, 0.00012277066707611084, 0.00012900680303573608, 0.00013524293899536133, 0.00014147907495498657, 0.00014771521091461182, 0.00015395134687423706, 0.0001601874828338623, 0.00016642361879348755, 0.0001726597547531128, 0.00017889589071273804, 0.00018513202667236328]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 5.0, 11.0, 13.0, 17.0, 29.0, 49.0, 70.0, 175.0, 442.0, 2333.0, 31065.0, 917374.0, 91851.0, 3989.0, 675.0, 207.0, 99.0, 45.0, 20.0, 18.0, 6.0, 16.0, 6.0, 3.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.39453125, -3.287200927734375, -3.17987060546875, -3.072540283203125, -2.9652099609375, -2.857879638671875, -2.75054931640625, -2.643218994140625, -2.535888671875, -2.428558349609375, -2.32122802734375, -2.213897705078125, -2.1065673828125, -1.999237060546875, -1.89190673828125, -1.784576416015625, -1.67724609375, -1.569915771484375, -1.46258544921875, -1.355255126953125, -1.2479248046875, -1.140594482421875, -1.03326416015625, -0.925933837890625, -0.818603515625, -0.711273193359375, -0.60394287109375, -0.496612548828125, -0.3892822265625, -0.281951904296875, -0.17462158203125, -0.067291259765625, 0.0400390625, 0.147369384765625, 0.25469970703125, 0.362030029296875, 0.4693603515625, 0.576690673828125, 0.68402099609375, 0.791351318359375, 0.898681640625, 1.006011962890625, 1.11334228515625, 1.220672607421875, 1.3280029296875, 1.435333251953125, 1.54266357421875, 1.649993896484375, 1.75732421875, 1.864654541015625, 1.97198486328125, 2.079315185546875, 2.1866455078125, 2.293975830078125, 2.40130615234375, 2.508636474609375, 2.615966796875, 2.723297119140625, 2.83062744140625, 2.937957763671875, 3.0452880859375, 3.152618408203125, 3.25994873046875, 3.367279052734375, 3.474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 8.0, 7.0, 8.0, 17.0, 26.0, 35.0, 52.0, 66.0, 79.0, 102.0, 110.0, 97.0, 98.0, 81.0, 58.0, 50.0, 26.0, 21.0, 11.0, 13.0, 6.0, 8.0, 3.0, 1.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57275390625, -0.5522308349609375, -0.531707763671875, -0.5111846923828125, -0.49066162109375, -0.4701385498046875, -0.449615478515625, -0.4290924072265625, -0.4085693359375, -0.3880462646484375, -0.367523193359375, -0.3470001220703125, -0.32647705078125, -0.3059539794921875, -0.285430908203125, -0.2649078369140625, -0.244384765625, -0.2238616943359375, -0.203338623046875, -0.1828155517578125, -0.16229248046875, -0.1417694091796875, -0.121246337890625, -0.1007232666015625, -0.0802001953125, -0.0596771240234375, -0.039154052734375, -0.0186309814453125, 0.00189208984375, 0.0224151611328125, 0.042938232421875, 0.0634613037109375, 0.083984375, 0.1045074462890625, 0.125030517578125, 0.1455535888671875, 0.16607666015625, 0.1865997314453125, 0.207122802734375, 0.2276458740234375, 0.2481689453125, 0.2686920166015625, 0.289215087890625, 0.3097381591796875, 0.33026123046875, 0.3507843017578125, 0.371307373046875, 0.3918304443359375, 0.412353515625, 0.4328765869140625, 0.453399658203125, 0.4739227294921875, 0.49444580078125, 0.5149688720703125, 0.535491943359375, 0.5560150146484375, 0.5765380859375, 0.5970611572265625, 0.617584228515625, 0.6381072998046875, 0.65863037109375, 0.6791534423828125, 0.699676513671875, 0.7201995849609375, 0.74072265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 17.0, 11.0, 25.0, 47.0, 47.0, 77.0, 107.0, 114.0, 123.0, 118.0, 89.0, 66.0, 57.0, 35.0, 18.0, 16.0, 11.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46297025680542, -6.257547855377197, -6.052124977111816, -5.846702575683594, -5.641280174255371, -5.435857772827148, -5.230434894561768, -5.025012493133545, -4.819589614868164, -4.614167213439941, -4.4087443351745605, -4.203321933746338, -3.9978995323181152, -3.7924768924713135, -3.5870542526245117, -3.381631851196289, -3.1762094497680664, -2.9707868099212646, -2.765364408493042, -2.5599417686462402, -2.3545193672180176, -2.149096727371216, -1.943674087524414, -1.7382515668869019, -1.5328290462493896, -1.3274065256118774, -1.1219840049743652, -0.9165613651275635, -0.7111388444900513, -0.5057163238525391, -0.3002936840057373, -0.0948711633682251, 0.11055135726928711, 0.3159739077091217, 0.5213964581489563, 0.7268190383911133, 0.9322415590286255, 1.1376640796661377, 1.3430867195129395, 1.5485092401504517, 1.7539317607879639, 1.959354281425476, 2.1647768020629883, 2.37019944190979, 2.575622081756592, 2.7810444831848145, 2.986467123031616, 3.191889762878418, 3.3973121643066406, 3.6027348041534424, 3.808157205581665, 4.013579845428467, 4.2190022468566895, 4.42442512512207, 4.629847526550293, 4.835269927978516, 5.040692329406738, 5.246114730834961, 5.451537609100342, 5.6569600105285645, 5.862382411956787, 6.067805290222168, 6.273227691650391, 6.478650093078613, 6.684072971343994]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 12.0, 11.0, 18.0, 26.0, 26.0, 38.0, 40.0, 34.0, 61.0, 65.0, 66.0, 66.0, 61.0, 67.0, 76.0, 62.0, 60.0, 44.0, 39.0, 34.0, 24.0, 21.0, 17.0, 11.0, 4.0, 7.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.972057342529297, -11.689726829528809, -11.40739631652832, -11.125065803527832, -10.842735290527344, -10.560403823852539, -10.278074264526367, -9.995742797851562, -9.713412284851074, -9.431081771850586, -9.148751258850098, -8.86642074584961, -8.584090232849121, -8.301759719848633, -8.019428253173828, -7.737098217010498, -7.45476770401001, -7.1724371910095215, -6.890106678009033, -6.607775688171387, -6.325445175170898, -6.04311466217041, -5.760784149169922, -5.478453636169434, -5.196123123168945, -4.913792610168457, -4.631462097167969, -4.3491315841674805, -4.066800594329834, -3.7844700813293457, -3.5021395683288574, -3.219809055328369, -2.9374780654907227, -2.6551475524902344, -2.372816801071167, -2.0904862880706787, -1.8081556558609009, -1.525825023651123, -1.2434945106506348, -0.9611638784408569, -0.6788332462310791, -0.39650264382362366, -0.11417204141616821, 0.16815853118896484, 0.4504891633987427, 0.7328197956085205, 1.0151503086090088, 1.2974809408187866, 1.5798115730285645, 1.8621422052383423, 2.14447283744812, 2.4268033504486084, 2.709134101867676, 2.991464614868164, 3.2737951278686523, 3.5561256408691406, 3.838456392288208, 4.120787143707275, 4.403117656707764, 4.685448169708252, 4.96777868270874, 5.250109672546387, 5.532440185546875, 5.814770698547363, 6.097101211547852]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 6.0, 3.0, 15.0, 16.0, 28.0, 35.0, 50.0, 68.0, 106.0, 149.0, 253.0, 447.0, 946.0, 4906.0, 97344.0, 2601769.0, 1441915.0, 42289.0, 2613.0, 571.0, 277.0, 156.0, 100.0, 72.0, 48.0, 34.0, 15.0, 9.0, 11.0, 11.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.73284912109375, -4.5164794921875, -4.30010986328125, -4.083740234375, -3.86737060546875, -3.6510009765625, -3.43463134765625, -3.21826171875, -3.00189208984375, -2.7855224609375, -2.56915283203125, -2.352783203125, -2.13641357421875, -1.9200439453125, -1.70367431640625, -1.4873046875, -1.27093505859375, -1.0545654296875, -0.83819580078125, -0.621826171875, -0.40545654296875, -0.1890869140625, 0.02728271484375, 0.24365234375, 0.46002197265625, 0.6763916015625, 0.89276123046875, 1.109130859375, 1.32550048828125, 1.5418701171875, 1.75823974609375, 1.974609375, 2.19097900390625, 2.4073486328125, 2.62371826171875, 2.840087890625, 3.05645751953125, 3.2728271484375, 3.48919677734375, 3.70556640625, 3.92193603515625, 4.1383056640625, 4.35467529296875, 4.571044921875, 4.78741455078125, 5.0037841796875, 5.22015380859375, 5.4365234375, 5.65289306640625, 5.8692626953125, 6.08563232421875, 6.302001953125, 6.51837158203125, 6.7347412109375, 6.95111083984375, 7.16748046875, 7.38385009765625, 7.6002197265625, 7.81658935546875, 8.032958984375, 8.24932861328125, 8.4656982421875, 8.68206787109375, 8.8984375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 12.0, 14.0, 16.0, 26.0, 26.0, 23.0, 38.0, 44.0, 42.0, 38.0, 55.0, 51.0, 64.0, 50.0, 66.0, 48.0, 46.0, 46.0, 44.0, 30.0, 46.0, 27.0, 21.0, 18.0, 17.0, 12.0, 18.0, 9.0, 10.0, 5.0, 4.0, 1.0, 7.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.49700927734375, -2.4061279296875, -2.31524658203125, -2.224365234375, -2.13348388671875, -2.0426025390625, -1.95172119140625, -1.86083984375, -1.76995849609375, -1.6790771484375, -1.58819580078125, -1.497314453125, -1.40643310546875, -1.3155517578125, -1.22467041015625, -1.1337890625, -1.04290771484375, -0.9520263671875, -0.86114501953125, -0.770263671875, -0.67938232421875, -0.5885009765625, -0.49761962890625, -0.40673828125, -0.31585693359375, -0.2249755859375, -0.13409423828125, -0.043212890625, 0.04766845703125, 0.1385498046875, 0.22943115234375, 0.3203125, 0.41119384765625, 0.5020751953125, 0.59295654296875, 0.683837890625, 0.77471923828125, 0.8656005859375, 0.95648193359375, 1.04736328125, 1.13824462890625, 1.2291259765625, 1.32000732421875, 1.410888671875, 1.50177001953125, 1.5926513671875, 1.68353271484375, 1.7744140625, 1.86529541015625, 1.9561767578125, 2.04705810546875, 2.137939453125, 2.22882080078125, 2.3197021484375, 2.41058349609375, 2.50146484375, 2.59234619140625, 2.6832275390625, 2.77410888671875, 2.864990234375, 2.95587158203125, 3.0467529296875, 3.13763427734375, 3.228515625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 10.0, 31.0, 81.0, 240.0, 691.0, 3497.0, 225773.0, 3938379.0, 23183.0, 1672.0, 436.0, 181.0, 62.0, 23.0, 12.0, 3.0, 3.0, 4.0], "bins": [-18.015625, -17.677642822265625, -17.33966064453125, -17.001678466796875, -16.6636962890625, -16.325714111328125, -15.98773193359375, -15.649749755859375, -15.311767578125, -14.973785400390625, -14.63580322265625, -14.297821044921875, -13.9598388671875, -13.621856689453125, -13.28387451171875, -12.945892333984375, -12.60791015625, -12.269927978515625, -11.93194580078125, -11.593963623046875, -11.2559814453125, -10.917999267578125, -10.58001708984375, -10.242034912109375, -9.904052734375, -9.566070556640625, -9.22808837890625, -8.890106201171875, -8.5521240234375, -8.214141845703125, -7.87615966796875, -7.538177490234375, -7.2001953125, -6.862213134765625, -6.52423095703125, -6.186248779296875, -5.8482666015625, -5.510284423828125, -5.17230224609375, -4.834320068359375, -4.496337890625, -4.158355712890625, -3.82037353515625, -3.482391357421875, -3.1444091796875, -2.806427001953125, -2.46844482421875, -2.130462646484375, -1.79248046875, -1.454498291015625, -1.11651611328125, -0.778533935546875, -0.4405517578125, -0.102569580078125, 0.23541259765625, 0.573394775390625, 0.911376953125, 1.249359130859375, 1.58734130859375, 1.925323486328125, 2.2633056640625, 2.601287841796875, 2.93927001953125, 3.277252197265625, 3.615234375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 8.0, 14.0, 24.0, 31.0, 27.0, 38.0, 59.0, 82.0, 106.0, 149.0, 222.0, 278.0, 329.0, 444.0, 464.0, 437.0, 328.0, 267.0, 212.0, 157.0, 98.0, 76.0, 61.0, 41.0, 33.0, 30.0, 14.0, 5.0, 5.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.083984375, -1.0533676147460938, -1.0227508544921875, -0.9921340942382812, -0.961517333984375, -0.9309005737304688, -0.9002838134765625, -0.8696670532226562, -0.83905029296875, -0.8084335327148438, -0.7778167724609375, -0.7472000122070312, -0.716583251953125, -0.6859664916992188, -0.6553497314453125, -0.6247329711914062, -0.5941162109375, -0.5634994506835938, -0.5328826904296875, -0.5022659301757812, -0.471649169921875, -0.44103240966796875, -0.4104156494140625, -0.37979888916015625, -0.34918212890625, -0.31856536865234375, -0.2879486083984375, -0.25733184814453125, -0.226715087890625, -0.19609832763671875, -0.1654815673828125, -0.13486480712890625, -0.104248046875, -0.07363128662109375, -0.0430145263671875, -0.01239776611328125, 0.018218994140625, 0.04883575439453125, 0.0794525146484375, 0.11006927490234375, 0.14068603515625, 0.17130279541015625, 0.2019195556640625, 0.23253631591796875, 0.263153076171875, 0.29376983642578125, 0.3243865966796875, 0.35500335693359375, 0.3856201171875, 0.41623687744140625, 0.4468536376953125, 0.47747039794921875, 0.508087158203125, 0.5387039184570312, 0.5693206787109375, 0.5999374389648438, 0.63055419921875, 0.6611709594726562, 0.6917877197265625, 0.7224044799804688, 0.753021240234375, 0.7836380004882812, 0.8142547607421875, 0.8448715209960938, 0.87548828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 15.0, 13.0, 27.0, 47.0, 72.0, 101.0, 117.0, 126.0, 130.0, 100.0, 83.0, 72.0, 27.0, 31.0, 19.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.511949062347412, -5.320488929748535, -5.129029273986816, -4.9375691413879395, -4.746109485626221, -4.554649353027344, -4.363189697265625, -4.171729564666748, -3.98026967048645, -3.7888097763061523, -3.5973498821258545, -3.4058899879455566, -3.2144298553466797, -3.022970199584961, -2.831510066986084, -2.640050172805786, -2.4485902786254883, -2.2571303844451904, -2.0656704902648926, -1.8742104768753052, -1.6827505826950073, -1.4912906885147095, -1.299830675125122, -1.1083707809448242, -0.9169108867645264, -0.7254509925842285, -0.5339910387992859, -0.34253108501434326, -0.1510711908340454, 0.04038870334625244, 0.23184871673583984, 0.4233086109161377, 0.6147680282592773, 0.8062279224395752, 0.9976878762245178, 1.1891478300094604, 1.3806077241897583, 1.5720676183700562, 1.7635276317596436, 1.9549875259399414, 2.1464474201202393, 2.337907314300537, 2.529367208480835, 2.720827102661133, 2.9122872352600098, 3.1037468910217285, 3.2952070236206055, 3.4866669178009033, 3.678126811981201, 3.869586706161499, 4.061046600341797, 4.252506732940674, 4.443966388702393, 4.6354265213012695, 4.826886177062988, 5.018346309661865, 5.209806442260742, 5.401266574859619, 5.592726230621338, 5.784186363220215, 5.975646018981934, 6.1671061515808105, 6.3585662841796875, 6.550025939941406, 6.741485595703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 7.0, 6.0, 12.0, 11.0, 16.0, 13.0, 25.0, 20.0, 24.0, 28.0, 39.0, 43.0, 42.0, 39.0, 54.0, 45.0, 41.0, 34.0, 53.0, 41.0, 42.0, 38.0, 44.0, 43.0, 35.0, 35.0, 26.0, 22.0, 18.0, 17.0, 16.0, 17.0, 13.0, 8.0, 5.0, 4.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8771300315856934, -2.7858071327209473, -2.6944844722747803, -2.603161573410034, -2.511838912963867, -2.420516014099121, -2.329193115234375, -2.237870454788208, -2.146547794342041, -2.055224895477295, -1.963902235031128, -1.8725793361663818, -1.7812566757202148, -1.6899337768554688, -1.5986109972000122, -1.5072882175445557, -1.4159653186798096, -1.324642539024353, -1.2333197593688965, -1.1419968605041504, -1.0506742000579834, -0.9593513607978821, -0.8680285215377808, -0.7767057418823242, -0.6853829622268677, -0.5940601825714111, -0.5027374029159546, -0.41141456365585327, -0.32009178400039673, -0.22876900434494019, -0.13744616508483887, -0.046123385429382324, 0.04519963264465332, 0.13652242720127106, 0.2278452217578888, 0.3191680312156677, 0.41049081087112427, 0.5018135905265808, 0.5931364297866821, 0.6844592094421387, 0.7757819890975952, 0.8671047687530518, 0.9584275484085083, 1.0497503280639648, 1.141073226928711, 1.232395887374878, 1.323718786239624, 1.4150415658950806, 1.506364345550537, 1.5976871252059937, 1.6890099048614502, 1.7803328037261963, 1.8716554641723633, 1.9629783630371094, 2.0543012619018555, 2.1456239223480225, 2.2369465827941895, 2.3282694816589355, 2.4195921421051025, 2.5109150409698486, 2.6022377014160156, 2.6935606002807617, 2.784883499145508, 2.876206159591675, 2.967529058456421]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 22.0, 23.0, 27.0, 44.0, 52.0, 71.0, 132.0, 226.0, 354.0, 572.0, 956.0, 1746.0, 3144.0, 6207.0, 12833.0, 28790.0, 66350.0, 153648.0, 275533.0, 258096.0, 134569.0, 57170.0, 24483.0, 11215.0, 5580.0, 2920.0, 1571.0, 869.0, 495.0, 313.0, 187.0, 112.0, 73.0, 46.0, 28.0, 25.0, 23.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.44287109375, -0.42899322509765625, -0.4151153564453125, -0.40123748779296875, -0.387359619140625, -0.37348175048828125, -0.3596038818359375, -0.34572601318359375, -0.33184814453125, -0.31797027587890625, -0.3040924072265625, -0.29021453857421875, -0.276336669921875, -0.26245880126953125, -0.2485809326171875, -0.23470306396484375, -0.2208251953125, -0.20694732666015625, -0.1930694580078125, -0.17919158935546875, -0.165313720703125, -0.15143585205078125, -0.1375579833984375, -0.12368011474609375, -0.10980224609375, -0.09592437744140625, -0.0820465087890625, -0.06816864013671875, -0.054290771484375, -0.04041290283203125, -0.0265350341796875, -0.01265716552734375, 0.001220703125, 0.01509857177734375, 0.0289764404296875, 0.04285430908203125, 0.056732177734375, 0.07061004638671875, 0.0844879150390625, 0.09836578369140625, 0.11224365234375, 0.12612152099609375, 0.1399993896484375, 0.15387725830078125, 0.167755126953125, 0.18163299560546875, 0.1955108642578125, 0.20938873291015625, 0.2232666015625, 0.23714447021484375, 0.2510223388671875, 0.26490020751953125, 0.278778076171875, 0.29265594482421875, 0.3065338134765625, 0.32041168212890625, 0.33428955078125, 0.34816741943359375, 0.3620452880859375, 0.37592315673828125, 0.389801025390625, 0.40367889404296875, 0.4175567626953125, 0.43143463134765625, 0.4453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 9.0, 12.0, 22.0, 21.0, 25.0, 30.0, 43.0, 34.0, 52.0, 62.0, 58.0, 55.0, 61.0, 43.0, 59.0, 70.0, 55.0, 39.0, 52.0, 38.0, 28.0, 24.0, 21.0, 10.0, 18.0, 10.0, 8.0, 11.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.467010498046875, -2.38519287109375, -2.303375244140625, -2.2215576171875, -2.139739990234375, -2.05792236328125, -1.976104736328125, -1.894287109375, -1.812469482421875, -1.73065185546875, -1.648834228515625, -1.5670166015625, -1.485198974609375, -1.40338134765625, -1.321563720703125, -1.23974609375, -1.157928466796875, -1.07611083984375, -0.994293212890625, -0.9124755859375, -0.830657958984375, -0.74884033203125, -0.667022705078125, -0.585205078125, -0.503387451171875, -0.42156982421875, -0.339752197265625, -0.2579345703125, -0.176116943359375, -0.09429931640625, -0.012481689453125, 0.0693359375, 0.151153564453125, 0.23297119140625, 0.314788818359375, 0.3966064453125, 0.478424072265625, 0.56024169921875, 0.642059326171875, 0.723876953125, 0.805694580078125, 0.88751220703125, 0.969329833984375, 1.0511474609375, 1.132965087890625, 1.21478271484375, 1.296600341796875, 1.37841796875, 1.460235595703125, 1.54205322265625, 1.623870849609375, 1.7056884765625, 1.787506103515625, 1.86932373046875, 1.951141357421875, 2.032958984375, 2.114776611328125, 2.19659423828125, 2.278411865234375, 2.3602294921875, 2.442047119140625, 2.52386474609375, 2.605682373046875, 2.6875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 9.0, 5.0, 11.0, 21.0, 21.0, 39.0, 61.0, 77.0, 147.0, 204.0, 332.0, 484.0, 741.0, 1201.0, 1873.0, 3055.0, 5017.0, 8202.0, 13491.0, 23394.0, 40524.0, 67484.0, 110160.0, 160717.0, 186401.0, 158030.0, 106512.0, 65031.0, 38272.0, 22630.0, 13485.0, 8028.0, 4730.0, 2931.0, 1900.0, 1168.0, 729.0, 517.0, 295.0, 206.0, 132.0, 79.0, 61.0, 48.0, 28.0, 18.0, 14.0, 8.0, 8.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.2294921875, -0.22195816040039062, -0.21442413330078125, -0.20689010620117188, -0.1993560791015625, -0.19182205200195312, -0.18428802490234375, -0.17675399780273438, -0.169219970703125, -0.16168594360351562, -0.15415191650390625, -0.14661788940429688, -0.1390838623046875, -0.13154983520507812, -0.12401580810546875, -0.11648178100585938, -0.10894775390625, -0.10141372680664062, -0.09387969970703125, -0.08634567260742188, -0.0788116455078125, -0.07127761840820312, -0.06374359130859375, -0.056209564208984375, -0.048675537109375, -0.041141510009765625, -0.03360748291015625, -0.026073455810546875, -0.0185394287109375, -0.011005401611328125, -0.00347137451171875, 0.004062652587890625, 0.0115966796875, 0.019130706787109375, 0.02666473388671875, 0.034198760986328125, 0.0417327880859375, 0.049266815185546875, 0.05680084228515625, 0.06433486938476562, 0.071868896484375, 0.07940292358398438, 0.08693695068359375, 0.09447097778320312, 0.1020050048828125, 0.10953903198242188, 0.11707305908203125, 0.12460708618164062, 0.13214111328125, 0.13967514038085938, 0.14720916748046875, 0.15474319458007812, 0.1622772216796875, 0.16981124877929688, 0.17734527587890625, 0.18487930297851562, 0.192413330078125, 0.19994735717773438, 0.20748138427734375, 0.21501541137695312, 0.2225494384765625, 0.23008346557617188, 0.23761749267578125, 0.24515151977539062, 0.252685546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 4.0, 9.0, 13.0, 15.0, 16.0, 19.0, 19.0, 34.0, 38.0, 40.0, 45.0, 49.0, 34.0, 55.0, 66.0, 53.0, 73.0, 61.0, 48.0, 46.0, 41.0, 25.0, 38.0, 36.0, 22.0, 17.0, 6.0, 14.0, 12.0, 5.0, 15.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.22637939453125, -4.0816650390625, -3.93695068359375, -3.792236328125, -3.64752197265625, -3.5028076171875, -3.35809326171875, -3.21337890625, -3.06866455078125, -2.9239501953125, -2.77923583984375, -2.634521484375, -2.48980712890625, -2.3450927734375, -2.20037841796875, -2.0556640625, -1.91094970703125, -1.7662353515625, -1.62152099609375, -1.476806640625, -1.33209228515625, -1.1873779296875, -1.04266357421875, -0.89794921875, -0.75323486328125, -0.6085205078125, -0.46380615234375, -0.319091796875, -0.17437744140625, -0.0296630859375, 0.11505126953125, 0.259765625, 0.40447998046875, 0.5491943359375, 0.69390869140625, 0.838623046875, 0.98333740234375, 1.1280517578125, 1.27276611328125, 1.41748046875, 1.56219482421875, 1.7069091796875, 1.85162353515625, 1.996337890625, 2.14105224609375, 2.2857666015625, 2.43048095703125, 2.5751953125, 2.71990966796875, 2.8646240234375, 3.00933837890625, 3.154052734375, 3.29876708984375, 3.4434814453125, 3.58819580078125, 3.73291015625, 3.87762451171875, 4.0223388671875, 4.16705322265625, 4.311767578125, 4.45648193359375, 4.6011962890625, 4.74591064453125, 4.890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 5.0, 8.0, 9.0, 22.0, 24.0, 36.0, 40.0, 75.0, 97.0, 104.0, 168.0, 261.0, 376.0, 588.0, 1026.0, 1775.0, 3116.0, 6365.0, 13612.0, 30505.0, 69323.0, 156522.0, 305313.0, 251205.0, 114324.0, 50166.0, 22395.0, 10122.0, 4784.0, 2453.0, 1359.0, 797.0, 513.0, 325.0, 209.0, 139.0, 116.0, 80.0, 59.0, 40.0, 19.0, 22.0, 18.0, 13.0, 4.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.050537109375, -0.049085140228271484, -0.04763317108154297, -0.04618120193481445, -0.04472923278808594, -0.04327726364135742, -0.041825294494628906, -0.04037332534790039, -0.038921356201171875, -0.03746938705444336, -0.036017417907714844, -0.03456544876098633, -0.03311347961425781, -0.0316615104675293, -0.03020954132080078, -0.028757572174072266, -0.02730560302734375, -0.025853633880615234, -0.02440166473388672, -0.022949695587158203, -0.021497726440429688, -0.020045757293701172, -0.018593788146972656, -0.01714181900024414, -0.015689849853515625, -0.01423788070678711, -0.012785911560058594, -0.011333942413330078, -0.009881973266601562, -0.008430004119873047, -0.006978034973144531, -0.005526065826416016, -0.0040740966796875, -0.0026221275329589844, -0.0011701583862304688, 0.0002818107604980469, 0.0017337799072265625, 0.003185749053955078, 0.004637718200683594, 0.006089687347412109, 0.007541656494140625, 0.00899362564086914, 0.010445594787597656, 0.011897563934326172, 0.013349533081054688, 0.014801502227783203, 0.01625347137451172, 0.017705440521240234, 0.01915740966796875, 0.020609378814697266, 0.02206134796142578, 0.023513317108154297, 0.024965286254882812, 0.026417255401611328, 0.027869224548339844, 0.02932119369506836, 0.030773162841796875, 0.03222513198852539, 0.033677101135253906, 0.03512907028198242, 0.03658103942871094, 0.03803300857543945, 0.03948497772216797, 0.040936946868896484, 0.042388916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 14.0, 27.0, 28.0, 54.0, 61.0, 77.0, 118.0, 160.0, 105.0, 91.0, 83.0, 55.0, 36.0, 23.0, 24.0, 8.0, 10.0, 9.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.413459777832031e-05, -6.196461617946625e-05, -5.979463458061218e-05, -5.762465298175812e-05, -5.545467138290405e-05, -5.328468978404999e-05, -5.111470818519592e-05, -4.894472658634186e-05, -4.677474498748779e-05, -4.460476338863373e-05, -4.243478178977966e-05, -4.02648001909256e-05, -3.809481859207153e-05, -3.592483699321747e-05, -3.37548553943634e-05, -3.158487379550934e-05, -2.9414892196655273e-05, -2.724491059780121e-05, -2.5074928998947144e-05, -2.290494740009308e-05, -2.0734965801239014e-05, -1.856498420238495e-05, -1.6395002603530884e-05, -1.4225021004676819e-05, -1.2055039405822754e-05, -9.885057806968689e-06, -7.715076208114624e-06, -5.545094609260559e-06, -3.375113010406494e-06, -1.2051314115524292e-06, 9.648501873016357e-07, 3.1348317861557007e-06, 5.304813385009766e-06, 7.4747949838638306e-06, 9.644776582717896e-06, 1.181475818157196e-05, 1.3984739780426025e-05, 1.615472137928009e-05, 1.8324702978134155e-05, 2.049468457698822e-05, 2.2664666175842285e-05, 2.483464777469635e-05, 2.7004629373550415e-05, 2.917461097240448e-05, 3.1344592571258545e-05, 3.351457417011261e-05, 3.5684555768966675e-05, 3.785453736782074e-05, 4.0024518966674805e-05, 4.219450056552887e-05, 4.4364482164382935e-05, 4.6534463763237e-05, 4.8704445362091064e-05, 5.087442696094513e-05, 5.3044408559799194e-05, 5.521439015865326e-05, 5.7384371757507324e-05, 5.955435335636139e-05, 6.172433495521545e-05, 6.389431655406952e-05, 6.606429815292358e-05, 6.823427975177765e-05, 7.040426135063171e-05, 7.257424294948578e-05, 7.474422454833984e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 9.0, 8.0, 17.0, 11.0, 22.0, 34.0, 35.0, 66.0, 76.0, 100.0, 146.0, 275.0, 518.0, 1115.0, 2315.0, 5406.0, 13584.0, 34173.0, 87625.0, 229940.0, 368730.0, 185153.0, 71345.0, 27986.0, 11228.0, 4555.0, 1939.0, 928.0, 422.0, 264.0, 154.0, 98.0, 70.0, 53.0, 40.0, 34.0, 24.0, 15.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04681396484375, -0.04522085189819336, -0.04362773895263672, -0.04203462600708008, -0.04044151306152344, -0.0388484001159668, -0.037255287170410156, -0.035662174224853516, -0.034069061279296875, -0.032475948333740234, -0.030882835388183594, -0.029289722442626953, -0.027696609497070312, -0.026103496551513672, -0.02451038360595703, -0.02291727066040039, -0.02132415771484375, -0.01973104476928711, -0.01813793182373047, -0.016544818878173828, -0.014951705932617188, -0.013358592987060547, -0.011765480041503906, -0.010172367095947266, -0.008579254150390625, -0.006986141204833984, -0.005393028259277344, -0.003799915313720703, -0.0022068023681640625, -0.0006136894226074219, 0.0009794235229492188, 0.0025725364685058594, 0.0041656494140625, 0.005758762359619141, 0.007351875305175781, 0.008944988250732422, 0.010538101196289062, 0.012131214141845703, 0.013724327087402344, 0.015317440032958984, 0.016910552978515625, 0.018503665924072266, 0.020096778869628906, 0.021689891815185547, 0.023283004760742188, 0.024876117706298828, 0.02646923065185547, 0.02806234359741211, 0.02965545654296875, 0.03124856948852539, 0.03284168243408203, 0.03443479537963867, 0.03602790832519531, 0.03762102127075195, 0.039214134216308594, 0.040807247161865234, 0.042400360107421875, 0.043993473052978516, 0.045586585998535156, 0.0471796989440918, 0.04877281188964844, 0.05036592483520508, 0.05195903778076172, 0.05355215072631836, 0.055145263671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 13.0, 14.0, 23.0, 23.0, 28.0, 38.0, 43.0, 64.0, 63.0, 78.0, 88.0, 58.0, 70.0, 57.0, 59.0, 38.0, 36.0, 34.0, 18.0, 27.0, 20.0, 16.0, 14.0, 6.0, 8.0, 8.0, 6.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519012451171875, -0.014665961265563965, -0.01414179801940918, -0.013617634773254395, -0.01309347152709961, -0.012569308280944824, -0.012045145034790039, -0.011520981788635254, -0.010996818542480469, -0.010472655296325684, -0.009948492050170898, -0.009424328804016113, -0.008900165557861328, -0.008376002311706543, -0.007851839065551758, -0.007327675819396973, -0.0068035125732421875, -0.006279349327087402, -0.005755186080932617, -0.005231022834777832, -0.004706859588623047, -0.004182696342468262, -0.0036585330963134766, -0.0031343698501586914, -0.0026102066040039062, -0.002086043357849121, -0.001561880111694336, -0.0010377168655395508, -0.0005135536193847656, 1.0609626770019531e-05, 0.0005347728729248047, 0.0010589361190795898, 0.001583099365234375, 0.00210726261138916, 0.0026314258575439453, 0.0031555891036987305, 0.0036797523498535156, 0.004203915596008301, 0.004728078842163086, 0.005252242088317871, 0.005776405334472656, 0.006300568580627441, 0.0068247318267822266, 0.007348895072937012, 0.007873058319091797, 0.008397221565246582, 0.008921384811401367, 0.009445548057556152, 0.009969711303710938, 0.010493874549865723, 0.011018037796020508, 0.011542201042175293, 0.012066364288330078, 0.012590527534484863, 0.013114690780639648, 0.013638854026794434, 0.014163017272949219, 0.014687180519104004, 0.015211343765258789, 0.015735507011413574, 0.01625967025756836, 0.016783833503723145, 0.01730799674987793, 0.017832159996032715, 0.0183563232421875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 44.0, 294.0, 519.0, 136.0, 16.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.308990478515625, -12.782543182373047, -12.256094932556152, -11.729646682739258, -11.20319938659668, -10.676752090454102, -10.150303840637207, -9.623855590820312, -9.097408294677734, -8.570960998535156, -8.044512748718262, -7.518064975738525, -6.991617202758789, -6.465169429779053, -5.938721656799316, -5.41227388381958, -4.885826110839844, -4.359378337860107, -3.832930564880371, -3.3064827919006348, -2.7800350189208984, -2.253587245941162, -1.7271394729614258, -1.2006916999816895, -0.6742439270019531, -0.1477961540222168, 0.37865161895751953, 0.9050993919372559, 1.4315471649169922, 1.9579949378967285, 2.484442710876465, 3.010890483856201, 3.5373382568359375, 4.063786029815674, 4.59023380279541, 5.1166815757751465, 5.643129348754883, 6.169577121734619, 6.6960248947143555, 7.222472667694092, 7.748920440673828, 8.275367736816406, 8.8018159866333, 9.328264236450195, 9.854711532592773, 10.381158828735352, 10.907607078552246, 11.43405532836914, 11.960502624511719, 12.486949920654297, 13.013398170471191, 13.539846420288086, 14.066293716430664, 14.592741012573242, 15.119189262390137, 15.645637512207031, 16.17208480834961, 16.698532104492188, 17.224979400634766, 17.751428604125977, 18.277875900268555, 18.804323196411133, 19.330772399902344, 19.857219696044922, 20.3836669921875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 8.0, 2.0, 16.0, 7.0, 19.0, 23.0, 25.0, 32.0, 31.0, 49.0, 55.0, 54.0, 54.0, 56.0, 50.0, 55.0, 54.0, 57.0, 49.0, 49.0, 46.0, 43.0, 28.0, 22.0, 23.0, 20.0, 21.0, 14.0, 4.0, 10.0, 5.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2922892570495605, -2.2165064811706543, -2.140723705291748, -2.0649406909942627, -1.9891579151153564, -1.9133751392364502, -1.837592363357544, -1.7618095874786377, -1.686026692390442, -1.6102439165115356, -1.5344610214233398, -1.4586782455444336, -1.3828954696655273, -1.3071125745773315, -1.2313297986984253, -1.1555469036102295, -1.0797641277313232, -1.003981351852417, -0.9281984567642212, -0.8524156808853149, -0.7766328454017639, -0.7008500099182129, -0.6250672340393066, -0.5492843985557556, -0.4735015630722046, -0.39771872758865356, -0.3219359219074249, -0.2461531013250351, -0.17037028074264526, -0.09458744525909424, -0.0188046395778656, 0.05697816610336304, 0.13276100158691406, 0.2085438221693039, 0.2843266427516937, 0.36010944843292236, 0.4358922839164734, 0.5116751194000244, 0.5874578952789307, 0.6632407307624817, 0.7390235662460327, 0.8148064017295837, 0.8905892372131348, 0.966372013092041, 1.0421547889709473, 1.117937684059143, 1.1937204599380493, 1.2695033550262451, 1.3452861309051514, 1.4210689067840576, 1.4968518018722534, 1.5726345777511597, 1.6484174728393555, 1.7242002487182617, 1.799983024597168, 1.8757658004760742, 1.95154869556427, 2.027331590652466, 2.103114366531372, 2.1788971424102783, 2.2546799182891846, 2.33046293258667, 2.406245708465576, 2.4820284843444824, 2.5578112602233887]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 5.0, 18.0, 15.0, 21.0, 27.0, 41.0, 65.0, 131.0, 358.0, 1462.0, 11502.0, 188477.0, 725308.0, 112298.0, 7107.0, 1142.0, 267.0, 123.0, 51.0, 47.0, 16.0, 10.0, 13.0, 13.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.08154296875, -3.9326171875, -3.78369140625, -3.634765625, -3.48583984375, -3.3369140625, -3.18798828125, -3.0390625, -2.89013671875, -2.7412109375, -2.59228515625, -2.443359375, -2.29443359375, -2.1455078125, -1.99658203125, -1.84765625, -1.69873046875, -1.5498046875, -1.40087890625, -1.251953125, -1.10302734375, -0.9541015625, -0.80517578125, -0.65625, -0.50732421875, -0.3583984375, -0.20947265625, -0.060546875, 0.08837890625, 0.2373046875, 0.38623046875, 0.53515625, 0.68408203125, 0.8330078125, 0.98193359375, 1.130859375, 1.27978515625, 1.4287109375, 1.57763671875, 1.7265625, 1.87548828125, 2.0244140625, 2.17333984375, 2.322265625, 2.47119140625, 2.6201171875, 2.76904296875, 2.91796875, 3.06689453125, 3.2158203125, 3.36474609375, 3.513671875, 3.66259765625, 3.8115234375, 3.96044921875, 4.109375, 4.25830078125, 4.4072265625, 4.55615234375, 4.705078125, 4.85400390625, 5.0029296875, 5.15185546875, 5.30078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 8.0, 10.0, 9.0, 19.0, 19.0, 29.0, 29.0, 40.0, 31.0, 49.0, 55.0, 59.0, 56.0, 67.0, 55.0, 56.0, 49.0, 53.0, 44.0, 54.0, 29.0, 29.0, 25.0, 20.0, 24.0, 12.0, 20.0, 11.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.667724609375, -4.52294921875, -4.378173828125, -4.2333984375, -4.088623046875, -3.94384765625, -3.799072265625, -3.654296875, -3.509521484375, -3.36474609375, -3.219970703125, -3.0751953125, -2.930419921875, -2.78564453125, -2.640869140625, -2.49609375, -2.351318359375, -2.20654296875, -2.061767578125, -1.9169921875, -1.772216796875, -1.62744140625, -1.482666015625, -1.337890625, -1.193115234375, -1.04833984375, -0.903564453125, -0.7587890625, -0.614013671875, -0.46923828125, -0.324462890625, -0.1796875, -0.034912109375, 0.10986328125, 0.254638671875, 0.3994140625, 0.544189453125, 0.68896484375, 0.833740234375, 0.978515625, 1.123291015625, 1.26806640625, 1.412841796875, 1.5576171875, 1.702392578125, 1.84716796875, 1.991943359375, 2.13671875, 2.281494140625, 2.42626953125, 2.571044921875, 2.7158203125, 2.860595703125, 3.00537109375, 3.150146484375, 3.294921875, 3.439697265625, 3.58447265625, 3.729248046875, 3.8740234375, 4.018798828125, 4.16357421875, 4.308349609375, 4.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 9.0, 12.0, 12.0, 18.0, 23.0, 42.0, 56.0, 73.0, 114.0, 138.0, 202.0, 392.0, 1211.0, 10758.0, 410146.0, 605501.0, 16993.0, 1562.0, 451.0, 238.0, 154.0, 125.0, 82.0, 65.0, 52.0, 29.0, 23.0, 18.0, 12.0, 5.0, 3.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.13671875, -5.951171875, -5.765625, -5.580078125, -5.39453125, -5.208984375, -5.0234375, -4.837890625, -4.65234375, -4.466796875, -4.28125, -4.095703125, -3.91015625, -3.724609375, -3.5390625, -3.353515625, -3.16796875, -2.982421875, -2.796875, -2.611328125, -2.42578125, -2.240234375, -2.0546875, -1.869140625, -1.68359375, -1.498046875, -1.3125, -1.126953125, -0.94140625, -0.755859375, -0.5703125, -0.384765625, -0.19921875, -0.013671875, 0.171875, 0.357421875, 0.54296875, 0.728515625, 0.9140625, 1.099609375, 1.28515625, 1.470703125, 1.65625, 1.841796875, 2.02734375, 2.212890625, 2.3984375, 2.583984375, 2.76953125, 2.955078125, 3.140625, 3.326171875, 3.51171875, 3.697265625, 3.8828125, 4.068359375, 4.25390625, 4.439453125, 4.625, 4.810546875, 4.99609375, 5.181640625, 5.3671875, 5.552734375, 5.73828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 3.0, 14.0, 5.0, 16.0, 12.0, 28.0, 21.0, 21.0, 39.0, 40.0, 44.0, 47.0, 43.0, 48.0, 51.0, 43.0, 43.0, 60.0, 44.0, 41.0, 39.0, 37.0, 37.0, 35.0, 41.0, 20.0, 30.0, 22.0, 14.0, 14.0, 11.0, 8.0, 5.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.30859375, -5.15606689453125, -5.0035400390625, -4.85101318359375, -4.698486328125, -4.54595947265625, -4.3934326171875, -4.24090576171875, -4.08837890625, -3.93585205078125, -3.7833251953125, -3.63079833984375, -3.478271484375, -3.32574462890625, -3.1732177734375, -3.02069091796875, -2.8681640625, -2.71563720703125, -2.5631103515625, -2.41058349609375, -2.258056640625, -2.10552978515625, -1.9530029296875, -1.80047607421875, -1.64794921875, -1.49542236328125, -1.3428955078125, -1.19036865234375, -1.037841796875, -0.88531494140625, -0.7327880859375, -0.58026123046875, -0.427734375, -0.27520751953125, -0.1226806640625, 0.02984619140625, 0.182373046875, 0.33489990234375, 0.4874267578125, 0.63995361328125, 0.79248046875, 0.94500732421875, 1.0975341796875, 1.25006103515625, 1.402587890625, 1.55511474609375, 1.7076416015625, 1.86016845703125, 2.0126953125, 2.16522216796875, 2.3177490234375, 2.47027587890625, 2.622802734375, 2.77532958984375, 2.9278564453125, 3.08038330078125, 3.23291015625, 3.38543701171875, 3.5379638671875, 3.69049072265625, 3.843017578125, 3.99554443359375, 4.1480712890625, 4.30059814453125, 4.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 10.0, 12.0, 19.0, 47.0, 81.0, 225.0, 935.0, 8003.0, 665544.0, 366529.0, 5966.0, 790.0, 200.0, 77.0, 42.0, 29.0, 12.0, 10.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.5643310546875, -3.441162109375, -3.3179931640625, -3.19482421875, -3.0716552734375, -2.948486328125, -2.8253173828125, -2.7021484375, -2.5789794921875, -2.455810546875, -2.3326416015625, -2.20947265625, -2.0863037109375, -1.963134765625, -1.8399658203125, -1.716796875, -1.5936279296875, -1.470458984375, -1.3472900390625, -1.22412109375, -1.1009521484375, -0.977783203125, -0.8546142578125, -0.7314453125, -0.6082763671875, -0.485107421875, -0.3619384765625, -0.23876953125, -0.1156005859375, 0.007568359375, 0.1307373046875, 0.25390625, 0.3770751953125, 0.500244140625, 0.6234130859375, 0.74658203125, 0.8697509765625, 0.992919921875, 1.1160888671875, 1.2392578125, 1.3624267578125, 1.485595703125, 1.6087646484375, 1.73193359375, 1.8551025390625, 1.978271484375, 2.1014404296875, 2.224609375, 2.3477783203125, 2.470947265625, 2.5941162109375, 2.71728515625, 2.8404541015625, 2.963623046875, 3.0867919921875, 3.2099609375, 3.3331298828125, 3.456298828125, 3.5794677734375, 3.70263671875, 3.8258056640625, 3.948974609375, 4.0721435546875, 4.1953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 2.0, 6.0, 8.0, 11.0, 6.0, 13.0, 19.0, 32.0, 28.0, 43.0, 49.0, 57.0, 78.0, 120.0, 96.0, 86.0, 66.0, 58.0, 43.0, 36.0, 31.0, 29.0, 18.0, 16.0, 8.0, 4.0, 8.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018155574798583984, -0.00017639808356761932, -0.0001712404191493988, -0.00016608275473117828, -0.00016092509031295776, -0.00015576742589473724, -0.00015060976147651672, -0.0001454520970582962, -0.00014029443264007568, -0.00013513676822185516, -0.00012997910380363464, -0.00012482143938541412, -0.0001196637749671936, -0.00011450611054897308, -0.00010934844613075256, -0.00010419078171253204, -9.903311729431152e-05, -9.3875452876091e-05, -8.871778845787048e-05, -8.356012403964996e-05, -7.840245962142944e-05, -7.324479520320892e-05, -6.80871307849884e-05, -6.292946636676788e-05, -5.777180194854736e-05, -5.261413753032684e-05, -4.745647311210632e-05, -4.22988086938858e-05, -3.714114427566528e-05, -3.198347985744476e-05, -2.6825815439224243e-05, -2.1668151021003723e-05, -1.6510486602783203e-05, -1.1352822184562683e-05, -6.195157766342163e-06, -1.037493348121643e-06, 4.120171070098877e-06, 9.277835488319397e-06, 1.4435499906539917e-05, 1.9593164324760437e-05, 2.4750828742980957e-05, 2.9908493161201477e-05, 3.5066157579422e-05, 4.022382199764252e-05, 4.538148641586304e-05, 5.053915083408356e-05, 5.569681525230408e-05, 6.08544796705246e-05, 6.601214408874512e-05, 7.116980850696564e-05, 7.632747292518616e-05, 8.148513734340668e-05, 8.66428017616272e-05, 9.180046617984772e-05, 9.695813059806824e-05, 0.00010211579501628876, 0.00010727345943450928, 0.0001124311238527298, 0.00011758878827095032, 0.00012274645268917084, 0.00012790411710739136, 0.00013306178152561188, 0.0001382194459438324, 0.00014337711036205292, 0.00014853477478027344]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 13.0, 17.0, 18.0, 29.0, 45.0, 74.0, 160.0, 408.0, 2001.0, 31727.0, 968659.0, 42193.0, 2377.0, 460.0, 174.0, 78.0, 38.0, 33.0, 18.0, 10.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.95458984375, -2.8388671875, -2.72314453125, -2.607421875, -2.49169921875, -2.3759765625, -2.26025390625, -2.14453125, -2.02880859375, -1.9130859375, -1.79736328125, -1.681640625, -1.56591796875, -1.4501953125, -1.33447265625, -1.21875, -1.10302734375, -0.9873046875, -0.87158203125, -0.755859375, -0.64013671875, -0.5244140625, -0.40869140625, -0.29296875, -0.17724609375, -0.0615234375, 0.05419921875, 0.169921875, 0.28564453125, 0.4013671875, 0.51708984375, 0.6328125, 0.74853515625, 0.8642578125, 0.97998046875, 1.095703125, 1.21142578125, 1.3271484375, 1.44287109375, 1.55859375, 1.67431640625, 1.7900390625, 1.90576171875, 2.021484375, 2.13720703125, 2.2529296875, 2.36865234375, 2.484375, 2.60009765625, 2.7158203125, 2.83154296875, 2.947265625, 3.06298828125, 3.1787109375, 3.29443359375, 3.41015625, 3.52587890625, 3.6416015625, 3.75732421875, 3.873046875, 3.98876953125, 4.1044921875, 4.22021484375, 4.3359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 13.0, 14.0, 18.0, 37.0, 46.0, 68.0, 98.0, 100.0, 120.0, 113.0, 90.0, 89.0, 51.0, 41.0, 30.0, 14.0, 6.0, 12.0, 11.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7724609375, -0.7520523071289062, -0.7316436767578125, -0.7112350463867188, -0.690826416015625, -0.6704177856445312, -0.6500091552734375, -0.6296005249023438, -0.60919189453125, -0.5887832641601562, -0.5683746337890625, -0.5479660034179688, -0.527557373046875, -0.5071487426757812, -0.4867401123046875, -0.46633148193359375, -0.4459228515625, -0.42551422119140625, -0.4051055908203125, -0.38469696044921875, -0.364288330078125, -0.34387969970703125, -0.3234710693359375, -0.30306243896484375, -0.28265380859375, -0.26224517822265625, -0.2418365478515625, -0.22142791748046875, -0.201019287109375, -0.18061065673828125, -0.1602020263671875, -0.13979339599609375, -0.119384765625, -0.09897613525390625, -0.0785675048828125, -0.05815887451171875, -0.037750244140625, -0.01734161376953125, 0.0030670166015625, 0.02347564697265625, 0.04388427734375, 0.06429290771484375, 0.0847015380859375, 0.10511016845703125, 0.125518798828125, 0.14592742919921875, 0.1663360595703125, 0.18674468994140625, 0.2071533203125, 0.22756195068359375, 0.2479705810546875, 0.26837921142578125, 0.288787841796875, 0.30919647216796875, 0.3296051025390625, 0.35001373291015625, 0.37042236328125, 0.39083099365234375, 0.4112396240234375, 0.43164825439453125, 0.452056884765625, 0.47246551513671875, 0.4928741455078125, 0.5132827758789062, 0.53369140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 15.0, 23.0, 48.0, 65.0, 108.0, 154.0, 190.0, 151.0, 106.0, 66.0, 33.0, 20.0, 10.0, 8.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.412341117858887, -5.099510669708252, -4.786680221557617, -4.473849773406982, -4.161019325256348, -3.848189115524292, -3.5353589057922363, -3.2225284576416016, -2.909698009490967, -2.596867561340332, -2.2840371131896973, -1.9712069034576416, -1.6583764553070068, -1.345546007156372, -1.0327156782150269, -0.7198853492736816, -0.4070549011230469, -0.09422451257705688, 0.2186058759689331, 0.5314362645149231, 0.8442666530609131, 1.1570971012115479, 1.469927430152893, 1.7827577590942383, 2.095588207244873, 2.408418655395508, 2.7212491035461426, 3.0340793132781982, 3.346909761428833, 3.6597402095794678, 3.9725704193115234, 4.285400867462158, 4.598230361938477, 4.911060810089111, 5.223891258239746, 5.536721706390381, 5.849552154541016, 6.162382125854492, 6.475212574005127, 6.788043022155762, 7.1008734703063965, 7.413703918457031, 7.726534366607666, 8.0393648147583, 8.352194786071777, 8.66502571105957, 8.977855682373047, 9.290685653686523, 9.603516578674316, 9.916346549987793, 10.229177474975586, 10.542007446289062, 10.854838371276855, 11.167668342590332, 11.480499267578125, 11.793329238891602, 12.106159210205078, 12.418989181518555, 12.731820106506348, 13.044650077819824, 13.357481002807617, 13.670310974121094, 13.983141899108887, 14.295971870422363, 14.608802795410156]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 3.0, 6.0, 9.0, 6.0, 7.0, 13.0, 13.0, 21.0, 18.0, 15.0, 30.0, 16.0, 27.0, 28.0, 30.0, 31.0, 48.0, 38.0, 39.0, 42.0, 38.0, 36.0, 41.0, 41.0, 31.0, 37.0, 42.0, 28.0, 31.0, 34.0, 26.0, 25.0, 16.0, 28.0, 21.0, 13.0, 10.0, 8.0, 12.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.989990234375, -6.780808448791504, -6.571626663208008, -6.362444877624512, -6.153263092041016, -5.9440813064575195, -5.734899520874023, -5.525717735290527, -5.316535949707031, -5.107354164123535, -4.898172378540039, -4.688990592956543, -4.479808807373047, -4.270627021789551, -4.061445236206055, -3.8522634506225586, -3.6430819034576416, -3.4339001178741455, -3.2247183322906494, -3.0155365467071533, -2.8063547611236572, -2.5971732139587402, -2.387991428375244, -2.178809642791748, -1.9696277379989624, -1.7604459524154663, -1.5512641668319702, -1.3420825004577637, -1.1329007148742676, -0.9237189292907715, -0.7145371437072754, -0.5053553581237793, -0.2961735725402832, -0.0869918018579483, 0.1221899688243866, 0.3313717246055603, 0.5405535101890564, 0.7497352361679077, 0.9589170217514038, 1.1680988073349, 1.377280592918396, 1.586462378501892, 1.7956441640853882, 2.0048258304595947, 2.214007616043091, 2.423189401626587, 2.632371187210083, 2.841552972793579, 3.050734758377075, 3.2599165439605713, 3.4690983295440674, 3.6782801151275635, 3.8874619007110596, 4.096643447875977, 4.305825233459473, 4.515007019042969, 4.724188804626465, 4.933370590209961, 5.142552375793457, 5.351734161376953, 5.560915946960449, 5.770097732543945, 5.979279518127441, 6.1884613037109375, 6.397643089294434]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 15.0, 18.0, 28.0, 56.0, 83.0, 145.0, 291.0, 500.0, 1473.0, 14835.0, 1133063.0, 2995897.0, 44668.0, 2202.0, 524.0, 200.0, 94.0, 65.0, 39.0, 26.0, 16.0, 11.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.6241455078125, -6.349853515625, -6.0755615234375, -5.80126953125, -5.5269775390625, -5.252685546875, -4.9783935546875, -4.7041015625, -4.4298095703125, -4.155517578125, -3.8812255859375, -3.60693359375, -3.3326416015625, -3.058349609375, -2.7840576171875, -2.509765625, -2.2354736328125, -1.961181640625, -1.6868896484375, -1.41259765625, -1.1383056640625, -0.864013671875, -0.5897216796875, -0.3154296875, -0.0411376953125, 0.233154296875, 0.5074462890625, 0.78173828125, 1.0560302734375, 1.330322265625, 1.6046142578125, 1.87890625, 2.1531982421875, 2.427490234375, 2.7017822265625, 2.97607421875, 3.2503662109375, 3.524658203125, 3.7989501953125, 4.0732421875, 4.3475341796875, 4.621826171875, 4.8961181640625, 5.17041015625, 5.4447021484375, 5.718994140625, 5.9932861328125, 6.267578125, 6.5418701171875, 6.816162109375, 7.0904541015625, 7.36474609375, 7.6390380859375, 7.913330078125, 8.1876220703125, 8.4619140625, 8.7362060546875, 9.010498046875, 9.2847900390625, 9.55908203125, 9.8333740234375, 10.107666015625, 10.3819580078125, 10.65625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 14.0, 19.0, 24.0, 28.0, 38.0, 25.0, 41.0, 49.0, 42.0, 59.0, 54.0, 61.0, 48.0, 48.0, 51.0, 52.0, 56.0, 38.0, 34.0, 29.0, 36.0, 15.0, 19.0, 23.0, 19.0, 14.0, 10.0, 12.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.544921875, -2.45587158203125, -2.3668212890625, -2.27777099609375, -2.188720703125, -2.09967041015625, -2.0106201171875, -1.92156982421875, -1.83251953125, -1.74346923828125, -1.6544189453125, -1.56536865234375, -1.476318359375, -1.38726806640625, -1.2982177734375, -1.20916748046875, -1.1201171875, -1.03106689453125, -0.9420166015625, -0.85296630859375, -0.763916015625, -0.67486572265625, -0.5858154296875, -0.49676513671875, -0.40771484375, -0.31866455078125, -0.2296142578125, -0.14056396484375, -0.051513671875, 0.03753662109375, 0.1265869140625, 0.21563720703125, 0.3046875, 0.39373779296875, 0.4827880859375, 0.57183837890625, 0.660888671875, 0.74993896484375, 0.8389892578125, 0.92803955078125, 1.01708984375, 1.10614013671875, 1.1951904296875, 1.28424072265625, 1.373291015625, 1.46234130859375, 1.5513916015625, 1.64044189453125, 1.7294921875, 1.81854248046875, 1.9075927734375, 1.99664306640625, 2.085693359375, 2.17474365234375, 2.2637939453125, 2.35284423828125, 2.44189453125, 2.53094482421875, 2.6199951171875, 2.70904541015625, 2.798095703125, 2.88714599609375, 2.9761962890625, 3.06524658203125, 3.154296875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 5.0, 14.0, 9.0, 22.0, 31.0, 25.0, 44.0, 50.0, 98.0, 135.0, 197.0, 319.0, 496.0, 895.0, 1688.0, 3818.0, 11549.0, 49492.0, 321199.0, 2373076.0, 1243765.0, 146760.0, 27102.0, 7353.0, 2785.0, 1359.0, 692.0, 448.0, 243.0, 180.0, 109.0, 88.0, 58.0, 50.0, 39.0, 28.0, 12.0, 8.0, 11.0, 8.0, 5.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.865234375, -2.775146484375, -2.68505859375, -2.594970703125, -2.5048828125, -2.414794921875, -2.32470703125, -2.234619140625, -2.14453125, -2.054443359375, -1.96435546875, -1.874267578125, -1.7841796875, -1.694091796875, -1.60400390625, -1.513916015625, -1.423828125, -1.333740234375, -1.24365234375, -1.153564453125, -1.0634765625, -0.973388671875, -0.88330078125, -0.793212890625, -0.703125, -0.613037109375, -0.52294921875, -0.432861328125, -0.3427734375, -0.252685546875, -0.16259765625, -0.072509765625, 0.017578125, 0.107666015625, 0.19775390625, 0.287841796875, 0.3779296875, 0.468017578125, 0.55810546875, 0.648193359375, 0.73828125, 0.828369140625, 0.91845703125, 1.008544921875, 1.0986328125, 1.188720703125, 1.27880859375, 1.368896484375, 1.458984375, 1.549072265625, 1.63916015625, 1.729248046875, 1.8193359375, 1.909423828125, 1.99951171875, 2.089599609375, 2.1796875, 2.269775390625, 2.35986328125, 2.449951171875, 2.5400390625, 2.630126953125, 2.72021484375, 2.810302734375, 2.900390625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 9.0, 12.0, 27.0, 30.0, 50.0, 39.0, 66.0, 95.0, 125.0, 181.0, 251.0, 330.0, 407.0, 491.0, 477.0, 396.0, 293.0, 225.0, 164.0, 109.0, 81.0, 66.0, 36.0, 27.0, 13.0, 21.0, 6.0, 15.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9188613891601562, -0.8880157470703125, -0.8571701049804688, -0.826324462890625, -0.7954788208007812, -0.7646331787109375, -0.7337875366210938, -0.70294189453125, -0.6720962524414062, -0.6412506103515625, -0.6104049682617188, -0.579559326171875, -0.5487136840820312, -0.5178680419921875, -0.48702239990234375, -0.4561767578125, -0.42533111572265625, -0.3944854736328125, -0.36363983154296875, -0.332794189453125, -0.30194854736328125, -0.2711029052734375, -0.24025726318359375, -0.20941162109375, -0.17856597900390625, -0.1477203369140625, -0.11687469482421875, -0.086029052734375, -0.05518341064453125, -0.0243377685546875, 0.00650787353515625, 0.037353515625, 0.06819915771484375, 0.0990447998046875, 0.12989044189453125, 0.160736083984375, 0.19158172607421875, 0.2224273681640625, 0.25327301025390625, 0.28411865234375, 0.31496429443359375, 0.3458099365234375, 0.37665557861328125, 0.407501220703125, 0.43834686279296875, 0.4691925048828125, 0.5000381469726562, 0.5308837890625, 0.5617294311523438, 0.5925750732421875, 0.6234207153320312, 0.654266357421875, 0.6851119995117188, 0.7159576416015625, 0.7468032836914062, 0.77764892578125, 0.8084945678710938, 0.8393402099609375, 0.8701858520507812, 0.901031494140625, 0.9318771362304688, 0.9627227783203125, 0.9935684204101562, 1.0244140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 23.0, 48.0, 40.0, 78.0, 95.0, 116.0, 106.0, 123.0, 92.0, 75.0, 59.0, 45.0, 33.0, 17.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6815876960754395, -4.513382911682129, -4.345178604125977, -4.176973819732666, -4.0087690353393555, -3.840564727783203, -3.6723599433898926, -3.504155397415161, -3.3359508514404297, -3.1677463054656982, -2.999541759490967, -2.8313369750976562, -2.663132429122925, -2.4949278831481934, -2.326723098754883, -2.1585185527801514, -1.99031400680542, -1.8221094608306885, -1.6539047956466675, -1.4857001304626465, -1.317495584487915, -1.1492910385131836, -0.9810863733291626, -0.8128817081451416, -0.6446771621704102, -0.47647255659103394, -0.3082679510116577, -0.1400633454322815, 0.028141260147094727, 0.19634586572647095, 0.36455047130584717, 0.5327551364898682, 0.7009592056274414, 0.8691638112068176, 1.0373684167861938, 1.2055730819702148, 1.3737776279449463, 1.5419821739196777, 1.7101868391036987, 1.8783915042877197, 2.046596050262451, 2.2148005962371826, 2.383005142211914, 2.5512099266052246, 2.719414472579956, 2.8876190185546875, 3.055823802947998, 3.2240283489227295, 3.392232894897461, 3.5604374408721924, 3.728641986846924, 3.8968467712402344, 4.065051078796387, 4.233255863189697, 4.401460647583008, 4.56966495513916, 4.737869739532471, 4.906074523925781, 5.074278831481934, 5.242483615875244, 5.410688400268555, 5.578892707824707, 5.747097492218018, 5.915302276611328, 6.0835065841674805]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 4.0, 9.0, 13.0, 16.0, 21.0, 18.0, 15.0, 24.0, 40.0, 42.0, 35.0, 32.0, 52.0, 45.0, 42.0, 49.0, 57.0, 43.0, 43.0, 45.0, 39.0, 29.0, 39.0, 32.0, 30.0, 29.0, 22.0, 26.0, 20.0, 12.0, 16.0, 12.0, 11.0, 10.0, 3.0, 6.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1871447563171387, -2.0993478298187256, -2.0115509033203125, -1.9237537384033203, -1.8359568119049072, -1.7481598854064941, -1.6603628396987915, -1.5725657939910889, -1.4847688674926758, -1.3969719409942627, -1.30917489528656, -1.2213778495788574, -1.1335809230804443, -1.0457839965820312, -0.9579869508743286, -0.8701899647712708, -0.7823929786682129, -0.694595992565155, -0.6067990064620972, -0.5190020203590393, -0.43120503425598145, -0.3434080481529236, -0.2556110620498657, -0.16781407594680786, -0.08001708984375, 0.007779896259307861, 0.09557688236236572, 0.18337386846542358, 0.27117085456848145, 0.3589678406715393, 0.44676482677459717, 0.534561812877655, 0.6223587989807129, 0.7101557850837708, 0.7979527711868286, 0.8857497572898865, 0.9735467433929443, 1.0613436698913574, 1.14914071559906, 1.2369377613067627, 1.3247346878051758, 1.4125316143035889, 1.5003286600112915, 1.5881257057189941, 1.6759226322174072, 1.7637195587158203, 1.851516604423523, 1.9393136501312256, 2.0271105766296387, 2.1149075031280518, 2.202704429626465, 2.290501594543457, 2.37829852104187, 2.466095447540283, 2.5538926124572754, 2.6416895389556885, 2.7294864654541016, 2.8172833919525146, 2.9050803184509277, 2.99287748336792, 3.080674409866333, 3.168471336364746, 3.2562685012817383, 3.3440654277801514, 3.4318623542785645]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 9.0, 12.0, 10.0, 18.0, 45.0, 42.0, 72.0, 127.0, 187.0, 299.0, 475.0, 782.0, 1386.0, 2585.0, 4755.0, 8998.0, 17310.0, 34162.0, 69057.0, 134523.0, 222737.0, 236295.0, 152690.0, 79492.0, 39834.0, 20090.0, 10338.0, 5382.0, 2840.0, 1616.0, 959.0, 547.0, 360.0, 169.0, 124.0, 65.0, 54.0, 33.0, 21.0, 12.0, 8.0, 11.0, 10.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29833984375, -0.2880897521972656, -0.27783966064453125, -0.2675895690917969, -0.2573394775390625, -0.24708938598632812, -0.23683929443359375, -0.22658920288085938, -0.216339111328125, -0.20608901977539062, -0.19583892822265625, -0.18558883666992188, -0.1753387451171875, -0.16508865356445312, -0.15483856201171875, -0.14458847045898438, -0.13433837890625, -0.12408828735351562, -0.11383819580078125, -0.10358810424804688, -0.0933380126953125, -0.08308792114257812, -0.07283782958984375, -0.06258773803710938, -0.052337646484375, -0.042087554931640625, -0.03183746337890625, -0.021587371826171875, -0.0113372802734375, -0.001087188720703125, 0.00916290283203125, 0.019412994384765625, 0.0296630859375, 0.039913177490234375, 0.05016326904296875, 0.060413360595703125, 0.0706634521484375, 0.08091354370117188, 0.09116363525390625, 0.10141372680664062, 0.111663818359375, 0.12191390991210938, 0.13216400146484375, 0.14241409301757812, 0.1526641845703125, 0.16291427612304688, 0.17316436767578125, 0.18341445922851562, 0.19366455078125, 0.20391464233398438, 0.21416473388671875, 0.22441482543945312, 0.2346649169921875, 0.24491500854492188, 0.25516510009765625, 0.2654151916503906, 0.275665283203125, 0.2859153747558594, 0.29616546630859375, 0.3064155578613281, 0.3166656494140625, 0.3269157409667969, 0.33716583251953125, 0.3474159240722656, 0.357666015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 10.0, 18.0, 14.0, 23.0, 29.0, 32.0, 39.0, 50.0, 51.0, 54.0, 61.0, 46.0, 75.0, 52.0, 61.0, 54.0, 49.0, 42.0, 41.0, 34.0, 34.0, 19.0, 27.0, 21.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.977020263671875, -1.90325927734375, -1.829498291015625, -1.7557373046875, -1.681976318359375, -1.60821533203125, -1.534454345703125, -1.460693359375, -1.386932373046875, -1.31317138671875, -1.239410400390625, -1.1656494140625, -1.091888427734375, -1.01812744140625, -0.944366455078125, -0.87060546875, -0.796844482421875, -0.72308349609375, -0.649322509765625, -0.5755615234375, -0.501800537109375, -0.42803955078125, -0.354278564453125, -0.280517578125, -0.206756591796875, -0.13299560546875, -0.059234619140625, 0.0145263671875, 0.088287353515625, 0.16204833984375, 0.235809326171875, 0.3095703125, 0.383331298828125, 0.45709228515625, 0.530853271484375, 0.6046142578125, 0.678375244140625, 0.75213623046875, 0.825897216796875, 0.899658203125, 0.973419189453125, 1.04718017578125, 1.120941162109375, 1.1947021484375, 1.268463134765625, 1.34222412109375, 1.415985107421875, 1.48974609375, 1.563507080078125, 1.63726806640625, 1.711029052734375, 1.7847900390625, 1.858551025390625, 1.93231201171875, 2.006072998046875, 2.079833984375, 2.153594970703125, 2.22735595703125, 2.301116943359375, 2.3748779296875, 2.448638916015625, 2.52239990234375, 2.596160888671875, 2.669921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 13.0, 11.0, 27.0, 33.0, 37.0, 55.0, 116.0, 181.0, 253.0, 350.0, 578.0, 924.0, 1468.0, 2286.0, 3756.0, 6067.0, 9921.0, 16653.0, 28144.0, 47509.0, 78949.0, 126556.0, 179745.0, 187269.0, 138586.0, 88279.0, 52505.0, 31036.0, 18509.0, 11112.0, 6808.0, 4083.0, 2488.0, 1575.0, 916.0, 600.0, 411.0, 259.0, 156.0, 113.0, 79.0, 42.0, 35.0, 23.0, 16.0, 9.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.19921875, -0.19237518310546875, -0.1855316162109375, -0.17868804931640625, -0.171844482421875, -0.16500091552734375, -0.1581573486328125, -0.15131378173828125, -0.14447021484375, -0.13762664794921875, -0.1307830810546875, -0.12393951416015625, -0.117095947265625, -0.11025238037109375, -0.1034088134765625, -0.09656524658203125, -0.0897216796875, -0.08287811279296875, -0.0760345458984375, -0.06919097900390625, -0.062347412109375, -0.05550384521484375, -0.0486602783203125, -0.04181671142578125, -0.03497314453125, -0.02812957763671875, -0.0212860107421875, -0.01444244384765625, -0.007598876953125, -0.00075531005859375, 0.0060882568359375, 0.01293182373046875, 0.019775390625, 0.02661895751953125, 0.0334625244140625, 0.04030609130859375, 0.047149658203125, 0.05399322509765625, 0.0608367919921875, 0.06768035888671875, 0.07452392578125, 0.08136749267578125, 0.0882110595703125, 0.09505462646484375, 0.101898193359375, 0.10874176025390625, 0.1155853271484375, 0.12242889404296875, 0.1292724609375, 0.13611602783203125, 0.1429595947265625, 0.14980316162109375, 0.156646728515625, 0.16349029541015625, 0.1703338623046875, 0.17717742919921875, 0.18402099609375, 0.19086456298828125, 0.1977081298828125, 0.20455169677734375, 0.211395263671875, 0.21823883056640625, 0.2250823974609375, 0.23192596435546875, 0.23876953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 8.0, 7.0, 3.0, 10.0, 11.0, 17.0, 12.0, 18.0, 12.0, 22.0, 27.0, 22.0, 39.0, 45.0, 35.0, 52.0, 59.0, 65.0, 52.0, 47.0, 58.0, 61.0, 45.0, 39.0, 34.0, 31.0, 23.0, 25.0, 22.0, 19.0, 15.0, 16.0, 16.0, 12.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.5379638671875, -3.415771484375, -3.2935791015625, -3.17138671875, -3.0491943359375, -2.927001953125, -2.8048095703125, -2.6826171875, -2.5604248046875, -2.438232421875, -2.3160400390625, -2.19384765625, -2.0716552734375, -1.949462890625, -1.8272705078125, -1.705078125, -1.5828857421875, -1.460693359375, -1.3385009765625, -1.21630859375, -1.0941162109375, -0.971923828125, -0.8497314453125, -0.7275390625, -0.6053466796875, -0.483154296875, -0.3609619140625, -0.23876953125, -0.1165771484375, 0.005615234375, 0.1278076171875, 0.25, 0.3721923828125, 0.494384765625, 0.6165771484375, 0.73876953125, 0.8609619140625, 0.983154296875, 1.1053466796875, 1.2275390625, 1.3497314453125, 1.471923828125, 1.5941162109375, 1.71630859375, 1.8385009765625, 1.960693359375, 2.0828857421875, 2.205078125, 2.3272705078125, 2.449462890625, 2.5716552734375, 2.69384765625, 2.8160400390625, 2.938232421875, 3.0604248046875, 3.1826171875, 3.3048095703125, 3.427001953125, 3.5491943359375, 3.67138671875, 3.7935791015625, 3.915771484375, 4.0379638671875, 4.16015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 12.0, 14.0, 17.0, 21.0, 42.0, 67.0, 86.0, 111.0, 166.0, 263.0, 359.0, 556.0, 879.0, 1551.0, 2697.0, 5497.0, 11883.0, 29287.0, 72777.0, 192802.0, 373907.0, 215857.0, 80788.0, 32216.0, 13543.0, 6032.0, 2893.0, 1567.0, 913.0, 563.0, 358.0, 261.0, 163.0, 117.0, 77.0, 64.0, 44.0, 30.0, 16.0, 14.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.041748046875, -0.04050397872924805, -0.039259910583496094, -0.03801584243774414, -0.03677177429199219, -0.035527706146240234, -0.03428363800048828, -0.03303956985473633, -0.031795501708984375, -0.030551433563232422, -0.02930736541748047, -0.028063297271728516, -0.026819229125976562, -0.02557516098022461, -0.024331092834472656, -0.023087024688720703, -0.02184295654296875, -0.020598888397216797, -0.019354820251464844, -0.01811075210571289, -0.016866683959960938, -0.015622615814208984, -0.014378547668457031, -0.013134479522705078, -0.011890411376953125, -0.010646343231201172, -0.009402275085449219, -0.008158206939697266, -0.0069141387939453125, -0.005670070648193359, -0.004426002502441406, -0.003181934356689453, -0.0019378662109375, -0.0006937980651855469, 0.0005502700805664062, 0.0017943382263183594, 0.0030384063720703125, 0.004282474517822266, 0.005526542663574219, 0.006770610809326172, 0.008014678955078125, 0.009258747100830078, 0.010502815246582031, 0.011746883392333984, 0.012990951538085938, 0.01423501968383789, 0.015479087829589844, 0.016723155975341797, 0.01796722412109375, 0.019211292266845703, 0.020455360412597656, 0.02169942855834961, 0.022943496704101562, 0.024187564849853516, 0.02543163299560547, 0.026675701141357422, 0.027919769287109375, 0.029163837432861328, 0.03040790557861328, 0.031651973724365234, 0.03289604187011719, 0.03414011001586914, 0.035384178161621094, 0.03662824630737305, 0.037872314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 11.0, 18.0, 27.0, 43.0, 70.0, 82.0, 105.0, 127.0, 126.0, 106.0, 63.0, 62.0, 41.0, 33.0, 21.0, 14.0, 15.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.441904067993164e-05, -5.2912160754203796e-05, -5.140528082847595e-05, -4.989840090274811e-05, -4.8391520977020264e-05, -4.688464105129242e-05, -4.5377761125564575e-05, -4.387088119983673e-05, -4.236400127410889e-05, -4.085712134838104e-05, -3.93502414226532e-05, -3.7843361496925354e-05, -3.633648157119751e-05, -3.4829601645469666e-05, -3.332272171974182e-05, -3.181584179401398e-05, -3.0308961868286133e-05, -2.880208194255829e-05, -2.7295202016830444e-05, -2.57883220911026e-05, -2.4281442165374756e-05, -2.277456223964691e-05, -2.1267682313919067e-05, -1.9760802388191223e-05, -1.825392246246338e-05, -1.6747042536735535e-05, -1.524016261100769e-05, -1.3733282685279846e-05, -1.2226402759552002e-05, -1.0719522833824158e-05, -9.212642908096313e-06, -7.70576298236847e-06, -6.198883056640625e-06, -4.692003130912781e-06, -3.1851232051849365e-06, -1.6782432794570923e-06, -1.7136335372924805e-07, 1.3355165719985962e-06, 2.8423964977264404e-06, 4.349276423454285e-06, 5.856156349182129e-06, 7.363036274909973e-06, 8.869916200637817e-06, 1.0376796126365662e-05, 1.1883676052093506e-05, 1.339055597782135e-05, 1.4897435903549194e-05, 1.640431582927704e-05, 1.7911195755004883e-05, 1.9418075680732727e-05, 2.092495560646057e-05, 2.2431835532188416e-05, 2.393871545791626e-05, 2.5445595383644104e-05, 2.6952475309371948e-05, 2.8459355235099792e-05, 2.9966235160827637e-05, 3.147311508655548e-05, 3.2979995012283325e-05, 3.448687493801117e-05, 3.5993754863739014e-05, 3.750063478946686e-05, 3.90075147151947e-05, 4.0514394640922546e-05, 4.202127456665039e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 12.0, 10.0, 10.0, 26.0, 24.0, 46.0, 54.0, 61.0, 94.0, 155.0, 298.0, 532.0, 1248.0, 3007.0, 8031.0, 23491.0, 72940.0, 241580.0, 430138.0, 182529.0, 55249.0, 18095.0, 6366.0, 2380.0, 1011.0, 494.0, 230.0, 135.0, 106.0, 51.0, 38.0, 33.0, 19.0, 19.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.052001953125, -0.05048942565917969, -0.048976898193359375, -0.04746437072753906, -0.04595184326171875, -0.04443931579589844, -0.042926788330078125, -0.04141426086425781, -0.0399017333984375, -0.03838920593261719, -0.036876678466796875, -0.03536415100097656, -0.03385162353515625, -0.03233909606933594, -0.030826568603515625, -0.029314041137695312, -0.027801513671875, -0.026288986206054688, -0.024776458740234375, -0.023263931274414062, -0.02175140380859375, -0.020238876342773438, -0.018726348876953125, -0.017213821411132812, -0.0157012939453125, -0.014188766479492188, -0.012676239013671875, -0.011163711547851562, -0.00965118408203125, -0.008138656616210938, -0.006626129150390625, -0.0051136016845703125, -0.00360107421875, -0.0020885467529296875, -0.000576019287109375, 0.0009365081787109375, 0.00244903564453125, 0.0039615631103515625, 0.005474090576171875, 0.0069866180419921875, 0.0084991455078125, 0.010011672973632812, 0.011524200439453125, 0.013036727905273438, 0.01454925537109375, 0.016061782836914062, 0.017574310302734375, 0.019086837768554688, 0.020599365234375, 0.022111892700195312, 0.023624420166015625, 0.025136947631835938, 0.02664947509765625, 0.028162002563476562, 0.029674530029296875, 0.031187057495117188, 0.0326995849609375, 0.03421211242675781, 0.035724639892578125, 0.03723716735839844, 0.03874969482421875, 0.04026222229003906, 0.041774749755859375, 0.04328727722167969, 0.0447998046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 9.0, 17.0, 10.0, 17.0, 14.0, 23.0, 22.0, 29.0, 40.0, 47.0, 59.0, 71.0, 75.0, 87.0, 73.0, 72.0, 49.0, 39.0, 39.0, 22.0, 33.0, 13.0, 18.0, 18.0, 13.0, 8.0, 9.0, 15.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01336669921875, -0.012975931167602539, -0.012585163116455078, -0.012194395065307617, -0.011803627014160156, -0.011412858963012695, -0.011022090911865234, -0.010631322860717773, -0.010240554809570312, -0.009849786758422852, -0.00945901870727539, -0.00906825065612793, -0.008677482604980469, -0.008286714553833008, -0.007895946502685547, -0.007505178451538086, -0.007114410400390625, -0.006723642349243164, -0.006332874298095703, -0.005942106246948242, -0.005551338195800781, -0.00516057014465332, -0.004769802093505859, -0.0043790340423583984, -0.0039882659912109375, -0.0035974979400634766, -0.0032067298889160156, -0.0028159618377685547, -0.0024251937866210938, -0.002034425735473633, -0.0016436576843261719, -0.001252889633178711, -0.00086212158203125, -0.00047135353088378906, -8.058547973632812e-05, 0.0003101825714111328, 0.0007009506225585938, 0.0010917186737060547, 0.0014824867248535156, 0.0018732547760009766, 0.0022640228271484375, 0.0026547908782958984, 0.0030455589294433594, 0.0034363269805908203, 0.0038270950317382812, 0.004217863082885742, 0.004608631134033203, 0.004999399185180664, 0.005390167236328125, 0.005780935287475586, 0.006171703338623047, 0.006562471389770508, 0.006953239440917969, 0.00734400749206543, 0.007734775543212891, 0.008125543594360352, 0.008516311645507812, 0.008907079696655273, 0.009297847747802734, 0.009688615798950195, 0.010079383850097656, 0.010470151901245117, 0.010860919952392578, 0.011251688003540039, 0.0116424560546875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 22.0, 75.0, 207.0, 344.0, 229.0, 98.0, 27.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285140991210938, -7.9953107833862305, -7.705480098724365, -7.4156494140625, -7.125819206237793, -6.835988998413086, -6.546158313751221, -6.2563276290893555, -5.966497421264648, -5.676667213439941, -5.386836528778076, -5.097005844116211, -4.807175636291504, -4.517345428466797, -4.227514743804932, -3.9376842975616455, -3.6478538513183594, -3.3580234050750732, -3.068192958831787, -2.778362512588501, -2.488532066345215, -2.1987016201019287, -1.9088711738586426, -1.6190407276153564, -1.3292102813720703, -1.0393798351287842, -0.749549388885498, -0.4597189426422119, -0.16988849639892578, 0.11994194984436035, 0.4097723960876465, 0.6996028423309326, 0.9894332885742188, 1.2792637348175049, 1.569094181060791, 1.8589246273040771, 2.1487550735473633, 2.4385855197906494, 2.7284159660339355, 3.0182464122772217, 3.308076858520508, 3.597907304763794, 3.88773775100708, 4.177568435668945, 4.467398643493652, 4.757228851318359, 5.047059535980225, 5.33689022064209, 5.626720428466797, 5.916550636291504, 6.206381320953369, 6.496212005615234, 6.786042213439941, 7.075872421264648, 7.365703105926514, 7.655533790588379, 7.945363998413086, 8.235194206237793, 8.5250244140625, 8.814855575561523, 9.10468578338623, 9.394515991210938, 9.684347152709961, 9.974177360534668, 10.264007568359375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 4.0, 8.0, 15.0, 10.0, 22.0, 26.0, 27.0, 35.0, 39.0, 57.0, 50.0, 61.0, 61.0, 69.0, 62.0, 54.0, 60.0, 43.0, 48.0, 42.0, 36.0, 25.0, 29.0, 30.0, 19.0, 15.0, 13.0, 13.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75247061252594, -1.680452585220337, -1.6084344387054443, -1.5364164113998413, -1.4643983840942383, -1.3923802375793457, -1.3203622102737427, -1.2483441829681396, -1.176326036453247, -1.104308009147644, -1.0322898626327515, -0.9602718353271484, -0.8882537484169006, -0.8162356615066528, -0.7442176342010498, -0.672199547290802, -0.6001814603805542, -0.5281633734703064, -0.456145316362381, -0.38412725925445557, -0.31210917234420776, -0.24009108543395996, -0.16807302832603455, -0.09605497121810913, -0.024036884307861328, 0.04798118770122528, 0.11999925971031189, 0.1920173317193985, 0.2640354037284851, 0.3360534906387329, 0.4080715477466583, 0.48008960485458374, 0.552107572555542, 0.6241256594657898, 0.6961437463760376, 0.7681617736816406, 0.8401798605918884, 0.9121979475021362, 0.9842159748077393, 1.0562341213226318, 1.1282521486282349, 1.200270175933838, 1.2722883224487305, 1.3443063497543335, 1.4163243770599365, 1.488342523574829, 1.5603605508804321, 1.6323785781860352, 1.7043967247009277, 1.7764147520065308, 1.8484328985214233, 1.9204509258270264, 1.992469072341919, 2.0644869804382324, 2.136505126953125, 2.2085232734680176, 2.28054141998291, 2.3525595664978027, 2.424577474594116, 2.496595621109009, 2.5686137676239014, 2.640631675720215, 2.7126498222351074, 2.78466796875, 2.8566858768463135]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 10.0, 18.0, 21.0, 31.0, 37.0, 70.0, 112.0, 163.0, 301.0, 477.0, 845.0, 1679.0, 2996.0, 6544.0, 13119.0, 28816.0, 64778.0, 151884.0, 291144.0, 262220.0, 124225.0, 52830.0, 23681.0, 11123.0, 5420.0, 2640.0, 1433.0, 794.0, 401.0, 245.0, 163.0, 88.0, 68.0, 38.0, 28.0, 22.0, 16.0, 8.0, 6.0, 7.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.38671875, -1.3418121337890625, -1.296905517578125, -1.2519989013671875, -1.20709228515625, -1.1621856689453125, -1.117279052734375, -1.0723724365234375, -1.0274658203125, -0.9825592041015625, -0.937652587890625, -0.8927459716796875, -0.84783935546875, -0.8029327392578125, -0.758026123046875, -0.7131195068359375, -0.668212890625, -0.6233062744140625, -0.578399658203125, -0.5334930419921875, -0.48858642578125, -0.4436798095703125, -0.398773193359375, -0.3538665771484375, -0.3089599609375, -0.2640533447265625, -0.219146728515625, -0.1742401123046875, -0.12933349609375, -0.0844268798828125, -0.039520263671875, 0.0053863525390625, 0.05029296875, 0.0951995849609375, 0.140106201171875, 0.1850128173828125, 0.22991943359375, 0.2748260498046875, 0.319732666015625, 0.3646392822265625, 0.4095458984375, 0.4544525146484375, 0.499359130859375, 0.5442657470703125, 0.58917236328125, 0.6340789794921875, 0.678985595703125, 0.7238922119140625, 0.768798828125, 0.8137054443359375, 0.858612060546875, 0.9035186767578125, 0.94842529296875, 0.9933319091796875, 1.038238525390625, 1.0831451416015625, 1.1280517578125, 1.1729583740234375, 1.217864990234375, 1.2627716064453125, 1.30767822265625, 1.3525848388671875, 1.397491455078125, 1.4423980712890625, 1.4873046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 11.0, 15.0, 17.0, 17.0, 20.0, 26.0, 35.0, 29.0, 42.0, 51.0, 49.0, 33.0, 47.0, 54.0, 62.0, 52.0, 56.0, 38.0, 45.0, 40.0, 33.0, 33.0, 33.0, 29.0, 21.0, 17.0, 19.0, 14.0, 6.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.154296875, -3.035369873046875, -2.91644287109375, -2.797515869140625, -2.6785888671875, -2.559661865234375, -2.44073486328125, -2.321807861328125, -2.202880859375, -2.083953857421875, -1.96502685546875, -1.846099853515625, -1.7271728515625, -1.608245849609375, -1.48931884765625, -1.370391845703125, -1.25146484375, -1.132537841796875, -1.01361083984375, -0.894683837890625, -0.7757568359375, -0.656829833984375, -0.53790283203125, -0.418975830078125, -0.300048828125, -0.181121826171875, -0.06219482421875, 0.056732177734375, 0.1756591796875, 0.294586181640625, 0.41351318359375, 0.532440185546875, 0.6513671875, 0.770294189453125, 0.88922119140625, 1.008148193359375, 1.1270751953125, 1.246002197265625, 1.36492919921875, 1.483856201171875, 1.602783203125, 1.721710205078125, 1.84063720703125, 1.959564208984375, 2.0784912109375, 2.197418212890625, 2.31634521484375, 2.435272216796875, 2.55419921875, 2.673126220703125, 2.79205322265625, 2.910980224609375, 3.0299072265625, 3.148834228515625, 3.26776123046875, 3.386688232421875, 3.505615234375, 3.624542236328125, 3.74346923828125, 3.862396240234375, 3.9813232421875, 4.100250244140625, 4.21917724609375, 4.338104248046875, 4.45703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 22.0, 8.0, 22.0, 38.0, 49.0, 45.0, 69.0, 97.0, 138.0, 201.0, 343.0, 825.0, 3998.0, 51582.0, 724140.0, 250410.0, 13599.0, 1606.0, 487.0, 269.0, 170.0, 101.0, 77.0, 61.0, 29.0, 27.0, 26.0, 17.0, 15.0, 11.0, 9.0, 7.0, 10.0, 5.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.7305908203125, -4.586181640625, -4.4417724609375, -4.29736328125, -4.1529541015625, -4.008544921875, -3.8641357421875, -3.7197265625, -3.5753173828125, -3.430908203125, -3.2864990234375, -3.14208984375, -2.9976806640625, -2.853271484375, -2.7088623046875, -2.564453125, -2.4200439453125, -2.275634765625, -2.1312255859375, -1.98681640625, -1.8424072265625, -1.697998046875, -1.5535888671875, -1.4091796875, -1.2647705078125, -1.120361328125, -0.9759521484375, -0.83154296875, -0.6871337890625, -0.542724609375, -0.3983154296875, -0.25390625, -0.1094970703125, 0.034912109375, 0.1793212890625, 0.32373046875, 0.4681396484375, 0.612548828125, 0.7569580078125, 0.9013671875, 1.0457763671875, 1.190185546875, 1.3345947265625, 1.47900390625, 1.6234130859375, 1.767822265625, 1.9122314453125, 2.056640625, 2.2010498046875, 2.345458984375, 2.4898681640625, 2.63427734375, 2.7786865234375, 2.923095703125, 3.0675048828125, 3.2119140625, 3.3563232421875, 3.500732421875, 3.6451416015625, 3.78955078125, 3.9339599609375, 4.078369140625, 4.2227783203125, 4.3671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 5.0, 3.0, 11.0, 14.0, 18.0, 17.0, 21.0, 21.0, 17.0, 34.0, 39.0, 32.0, 33.0, 43.0, 36.0, 43.0, 52.0, 51.0, 52.0, 41.0, 42.0, 45.0, 48.0, 33.0, 33.0, 27.0, 20.0, 25.0, 19.0, 19.0, 21.0, 13.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0670166015625, -3.930908203125, -3.7947998046875, -3.65869140625, -3.5225830078125, -3.386474609375, -3.2503662109375, -3.1142578125, -2.9781494140625, -2.842041015625, -2.7059326171875, -2.56982421875, -2.4337158203125, -2.297607421875, -2.1614990234375, -2.025390625, -1.8892822265625, -1.753173828125, -1.6170654296875, -1.48095703125, -1.3448486328125, -1.208740234375, -1.0726318359375, -0.9365234375, -0.8004150390625, -0.664306640625, -0.5281982421875, -0.39208984375, -0.2559814453125, -0.119873046875, 0.0162353515625, 0.15234375, 0.2884521484375, 0.424560546875, 0.5606689453125, 0.69677734375, 0.8328857421875, 0.968994140625, 1.1051025390625, 1.2412109375, 1.3773193359375, 1.513427734375, 1.6495361328125, 1.78564453125, 1.9217529296875, 2.057861328125, 2.1939697265625, 2.330078125, 2.4661865234375, 2.602294921875, 2.7384033203125, 2.87451171875, 3.0106201171875, 3.146728515625, 3.2828369140625, 3.4189453125, 3.5550537109375, 3.691162109375, 3.8272705078125, 3.96337890625, 4.0994873046875, 4.235595703125, 4.3717041015625, 4.5078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 16.0, 24.0, 35.0, 72.0, 186.0, 486.0, 1764.0, 7098.0, 185098.0, 830388.0, 18935.0, 3023.0, 847.0, 293.0, 112.0, 46.0, 26.0, 22.0, 15.0, 10.0, 3.0, 10.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.306640625, -3.217803955078125, -3.12896728515625, -3.040130615234375, -2.9512939453125, -2.862457275390625, -2.77362060546875, -2.684783935546875, -2.595947265625, -2.507110595703125, -2.41827392578125, -2.329437255859375, -2.2406005859375, -2.151763916015625, -2.06292724609375, -1.974090576171875, -1.88525390625, -1.796417236328125, -1.70758056640625, -1.618743896484375, -1.5299072265625, -1.441070556640625, -1.35223388671875, -1.263397216796875, -1.174560546875, -1.085723876953125, -0.99688720703125, -0.908050537109375, -0.8192138671875, -0.730377197265625, -0.64154052734375, -0.552703857421875, -0.4638671875, -0.375030517578125, -0.28619384765625, -0.197357177734375, -0.1085205078125, -0.019683837890625, 0.06915283203125, 0.157989501953125, 0.246826171875, 0.335662841796875, 0.42449951171875, 0.513336181640625, 0.6021728515625, 0.691009521484375, 0.77984619140625, 0.868682861328125, 0.95751953125, 1.046356201171875, 1.13519287109375, 1.224029541015625, 1.3128662109375, 1.401702880859375, 1.49053955078125, 1.579376220703125, 1.668212890625, 1.757049560546875, 1.84588623046875, 1.934722900390625, 2.0235595703125, 2.112396240234375, 2.20123291015625, 2.290069580078125, 2.37890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 10.0, 14.0, 22.0, 47.0, 84.0, 149.0, 178.0, 197.0, 115.0, 70.0, 46.0, 24.0, 15.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037288665771484375, -0.0003618672490119934, -0.00035084784030914307, -0.0003398284316062927, -0.0003288090229034424, -0.00031778961420059204, -0.0003067702054977417, -0.00029575079679489136, -0.000284731388092041, -0.0002737119793891907, -0.00026269257068634033, -0.00025167316198349, -0.00024065375328063965, -0.0002296343445777893, -0.00021861493587493896, -0.00020759552717208862, -0.00019657611846923828, -0.00018555670976638794, -0.0001745373010635376, -0.00016351789236068726, -0.00015249848365783691, -0.00014147907495498657, -0.00013045966625213623, -0.00011944025754928589, -0.00010842084884643555, -9.74014401435852e-05, -8.638203144073486e-05, -7.536262273788452e-05, -6.434321403503418e-05, -5.332380533218384e-05, -4.2304396629333496e-05, -3.1284987926483154e-05, -2.0265579223632812e-05, -9.24617052078247e-06, 1.773238182067871e-06, 1.2792646884918213e-05, 2.3812055587768555e-05, 3.4831464290618896e-05, 4.585087299346924e-05, 5.687028169631958e-05, 6.788969039916992e-05, 7.890909910202026e-05, 8.99285078048706e-05, 0.00010094791650772095, 0.00011196732521057129, 0.00012298673391342163, 0.00013400614261627197, 0.00014502555131912231, 0.00015604496002197266, 0.000167064368724823, 0.00017808377742767334, 0.00018910318613052368, 0.00020012259483337402, 0.00021114200353622437, 0.0002221614122390747, 0.00023318082094192505, 0.0002442002296447754, 0.00025521963834762573, 0.0002662390470504761, 0.0002772584557533264, 0.00028827786445617676, 0.0002992972731590271, 0.00031031668186187744, 0.0003213360905647278, 0.0003323554992675781]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 18.0, 35.0, 54.0, 102.0, 197.0, 327.0, 803.0, 2037.0, 6906.0, 85967.0, 866122.0, 75871.0, 6577.0, 1951.0, 796.0, 324.0, 161.0, 93.0, 51.0, 39.0, 17.0, 18.0, 9.0, 3.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.8271484375, -1.7554473876953125, -1.683746337890625, -1.6120452880859375, -1.54034423828125, -1.4686431884765625, -1.396942138671875, -1.3252410888671875, -1.2535400390625, -1.1818389892578125, -1.110137939453125, -1.0384368896484375, -0.96673583984375, -0.8950347900390625, -0.823333740234375, -0.7516326904296875, -0.679931640625, -0.6082305908203125, -0.536529541015625, -0.4648284912109375, -0.39312744140625, -0.3214263916015625, -0.249725341796875, -0.1780242919921875, -0.1063232421875, -0.0346221923828125, 0.037078857421875, 0.1087799072265625, 0.18048095703125, 0.2521820068359375, 0.323883056640625, 0.3955841064453125, 0.46728515625, 0.5389862060546875, 0.610687255859375, 0.6823883056640625, 0.75408935546875, 0.8257904052734375, 0.897491455078125, 0.9691925048828125, 1.0408935546875, 1.1125946044921875, 1.184295654296875, 1.2559967041015625, 1.32769775390625, 1.3993988037109375, 1.471099853515625, 1.5428009033203125, 1.614501953125, 1.6862030029296875, 1.757904052734375, 1.8296051025390625, 1.90130615234375, 1.9730072021484375, 2.044708251953125, 2.1164093017578125, 2.1881103515625, 2.2598114013671875, 2.331512451171875, 2.4032135009765625, 2.47491455078125, 2.5466156005859375, 2.618316650390625, 2.6900177001953125, 2.76171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 6.0, 16.0, 14.0, 25.0, 38.0, 51.0, 96.0, 117.0, 110.0, 126.0, 101.0, 76.0, 64.0, 44.0, 31.0, 21.0, 12.0, 9.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5828628540039062, -0.5641632080078125, -0.5454635620117188, -0.526763916015625, -0.5080642700195312, -0.4893646240234375, -0.47066497802734375, -0.45196533203125, -0.43326568603515625, -0.4145660400390625, -0.39586639404296875, -0.377166748046875, -0.35846710205078125, -0.3397674560546875, -0.32106781005859375, -0.3023681640625, -0.28366851806640625, -0.2649688720703125, -0.24626922607421875, -0.227569580078125, -0.20886993408203125, -0.1901702880859375, -0.17147064208984375, -0.15277099609375, -0.13407135009765625, -0.1153717041015625, -0.09667205810546875, -0.077972412109375, -0.05927276611328125, -0.0405731201171875, -0.02187347412109375, -0.003173828125, 0.01552581787109375, 0.0342254638671875, 0.05292510986328125, 0.071624755859375, 0.09032440185546875, 0.1090240478515625, 0.12772369384765625, 0.14642333984375, 0.16512298583984375, 0.1838226318359375, 0.20252227783203125, 0.221221923828125, 0.23992156982421875, 0.2586212158203125, 0.27732086181640625, 0.2960205078125, 0.31472015380859375, 0.3334197998046875, 0.35211944580078125, 0.370819091796875, 0.38951873779296875, 0.4082183837890625, 0.42691802978515625, 0.44561767578125, 0.46431732177734375, 0.4830169677734375, 0.5017166137695312, 0.520416259765625, 0.5391159057617188, 0.5578155517578125, 0.5765151977539062, 0.59521484375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 17.0, 49.0, 149.0, 292.0, 307.0, 133.0, 47.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.72396469116211, -29.14010238647461, -28.556238174438477, -27.972375869750977, -27.388513565063477, -26.804651260375977, -26.220787048339844, -25.636924743652344, -25.053062438964844, -24.469200134277344, -23.88533592224121, -23.30147361755371, -22.71761131286621, -22.13374900817871, -21.549884796142578, -20.966022491455078, -20.382160186767578, -19.798297882080078, -19.214433670043945, -18.630571365356445, -18.046709060668945, -17.462846755981445, -16.878982543945312, -16.295120239257812, -15.71125602722168, -15.127392768859863, -14.543530464172363, -13.959667205810547, -13.375804901123047, -12.79194164276123, -12.208078384399414, -11.624216079711914, -11.040355682373047, -10.45649242401123, -9.87263011932373, -9.288766860961914, -8.704904556274414, -8.121041297912598, -7.5371785163879395, -6.953315734863281, -6.369452476501465, -5.785589694976807, -5.201726913452148, -4.617863655090332, -4.034001350402832, -3.4501383304595947, -2.8662753105163574, -2.282412528991699, -1.698549747467041, -1.1146869659423828, -0.5308240652084351, 0.053038835525512695, 0.6369016170501709, 1.220764398574829, 1.8046274185180664, 2.3884902000427246, 2.972352981567383, 3.556215763092041, 4.140078544616699, 4.723941802978516, 5.307804107666016, 5.891667366027832, 6.47553014755249, 7.059392929077148, 7.643255710601807]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 4.0, 10.0, 7.0, 13.0, 12.0, 21.0, 18.0, 18.0, 32.0, 34.0, 23.0, 26.0, 33.0, 46.0, 39.0, 36.0, 36.0, 38.0, 39.0, 46.0, 37.0, 31.0, 43.0, 39.0, 26.0, 23.0, 39.0, 24.0, 26.0, 21.0, 20.0, 20.0, 15.0, 16.0, 18.0, 6.0, 8.0, 4.0, 14.0, 7.0, 6.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.120534896850586, -5.917450428009033, -5.7143659591674805, -5.5112810134887695, -5.308196544647217, -5.105112075805664, -4.902027130126953, -4.6989426612854, -4.495858192443848, -4.292773723602295, -4.089689254760742, -3.8866043090820312, -3.6835198402404785, -3.480435371398926, -3.277350664138794, -3.074265956878662, -2.8711814880371094, -2.6680970191955566, -2.465012311935425, -2.261927604675293, -2.0588431358337402, -1.855758547782898, -1.6526739597320557, -1.4495893716812134, -1.246504783630371, -1.0434201955795288, -0.8403356075286865, -0.6372510194778442, -0.43416643142700195, -0.23108184337615967, -0.027997255325317383, 0.1750873327255249, 0.3781719207763672, 0.5812565088272095, 0.7843410968780518, 0.987425684928894, 1.1905102729797363, 1.3935948610305786, 1.596679449081421, 1.7997640371322632, 2.0028486251831055, 2.205933094024658, 2.40901780128479, 2.612102508544922, 2.8151869773864746, 3.0182714462280273, 3.221356153488159, 3.424440860748291, 3.6275253295898438, 3.8306097984313965, 4.033694267272949, 4.23677921295166, 4.439863681793213, 4.642948150634766, 4.846033096313477, 5.049117565155029, 5.252202033996582, 5.455286502838135, 5.6583709716796875, 5.861455917358398, 6.064540386199951, 6.267624855041504, 6.470709800720215, 6.673794269561768, 6.87687873840332]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 14.0, 15.0, 28.0, 31.0, 42.0, 74.0, 120.0, 143.0, 215.0, 390.0, 778.0, 1995.0, 9057.0, 80389.0, 1338919.0, 2548805.0, 193484.0, 15849.0, 2477.0, 672.0, 264.0, 155.0, 94.0, 70.0, 53.0, 29.0, 28.0, 16.0, 16.0, 8.0, 12.0, 6.0, 9.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.5003662109375, -4.340576171875, -4.1807861328125, -4.02099609375, -3.8612060546875, -3.701416015625, -3.5416259765625, -3.3818359375, -3.2220458984375, -3.062255859375, -2.9024658203125, -2.74267578125, -2.5828857421875, -2.423095703125, -2.2633056640625, -2.103515625, -1.9437255859375, -1.783935546875, -1.6241455078125, -1.46435546875, -1.3045654296875, -1.144775390625, -0.9849853515625, -0.8251953125, -0.6654052734375, -0.505615234375, -0.3458251953125, -0.18603515625, -0.0262451171875, 0.133544921875, 0.2933349609375, 0.453125, 0.6129150390625, 0.772705078125, 0.9324951171875, 1.09228515625, 1.2520751953125, 1.411865234375, 1.5716552734375, 1.7314453125, 1.8912353515625, 2.051025390625, 2.2108154296875, 2.37060546875, 2.5303955078125, 2.690185546875, 2.8499755859375, 3.009765625, 3.1695556640625, 3.329345703125, 3.4891357421875, 3.64892578125, 3.8087158203125, 3.968505859375, 4.1282958984375, 4.2880859375, 4.4478759765625, 4.607666015625, 4.7674560546875, 4.92724609375, 5.0870361328125, 5.246826171875, 5.4066162109375, 5.56640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 10.0, 8.0, 17.0, 16.0, 34.0, 25.0, 48.0, 42.0, 49.0, 46.0, 46.0, 68.0, 70.0, 79.0, 58.0, 63.0, 58.0, 49.0, 44.0, 35.0, 23.0, 20.0, 23.0, 18.0, 11.0, 7.0, 11.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.421875, -2.32513427734375, -2.2283935546875, -2.13165283203125, -2.034912109375, -1.93817138671875, -1.8414306640625, -1.74468994140625, -1.64794921875, -1.55120849609375, -1.4544677734375, -1.35772705078125, -1.260986328125, -1.16424560546875, -1.0675048828125, -0.97076416015625, -0.8740234375, -0.77728271484375, -0.6805419921875, -0.58380126953125, -0.487060546875, -0.39031982421875, -0.2935791015625, -0.19683837890625, -0.10009765625, -0.00335693359375, 0.0933837890625, 0.19012451171875, 0.286865234375, 0.38360595703125, 0.4803466796875, 0.57708740234375, 0.673828125, 0.77056884765625, 0.8673095703125, 0.96405029296875, 1.060791015625, 1.15753173828125, 1.2542724609375, 1.35101318359375, 1.44775390625, 1.54449462890625, 1.6412353515625, 1.73797607421875, 1.834716796875, 1.93145751953125, 2.0281982421875, 2.12493896484375, 2.2216796875, 2.31842041015625, 2.4151611328125, 2.51190185546875, 2.608642578125, 2.70538330078125, 2.8021240234375, 2.89886474609375, 2.99560546875, 3.09234619140625, 3.1890869140625, 3.28582763671875, 3.382568359375, 3.47930908203125, 3.5760498046875, 3.67279052734375, 3.76953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 13.0, 21.0, 14.0, 28.0, 35.0, 55.0, 78.0, 127.0, 178.0, 262.0, 431.0, 740.0, 1506.0, 3551.0, 11711.0, 64129.0, 667702.0, 2978303.0, 404985.0, 44913.0, 9234.0, 2946.0, 1373.0, 710.0, 418.0, 256.0, 172.0, 122.0, 72.0, 54.0, 40.0, 31.0, 24.0, 19.0, 12.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.166015625, -3.058349609375, -2.95068359375, -2.843017578125, -2.7353515625, -2.627685546875, -2.52001953125, -2.412353515625, -2.3046875, -2.197021484375, -2.08935546875, -1.981689453125, -1.8740234375, -1.766357421875, -1.65869140625, -1.551025390625, -1.443359375, -1.335693359375, -1.22802734375, -1.120361328125, -1.0126953125, -0.905029296875, -0.79736328125, -0.689697265625, -0.58203125, -0.474365234375, -0.36669921875, -0.259033203125, -0.1513671875, -0.043701171875, 0.06396484375, 0.171630859375, 0.279296875, 0.386962890625, 0.49462890625, 0.602294921875, 0.7099609375, 0.817626953125, 0.92529296875, 1.032958984375, 1.140625, 1.248291015625, 1.35595703125, 1.463623046875, 1.5712890625, 1.678955078125, 1.78662109375, 1.894287109375, 2.001953125, 2.109619140625, 2.21728515625, 2.324951171875, 2.4326171875, 2.540283203125, 2.64794921875, 2.755615234375, 2.86328125, 2.970947265625, 3.07861328125, 3.186279296875, 3.2939453125, 3.401611328125, 3.50927734375, 3.616943359375, 3.724609375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 10.0, 7.0, 10.0, 16.0, 31.0, 15.0, 32.0, 58.0, 64.0, 91.0, 130.0, 191.0, 241.0, 354.0, 403.0, 471.0, 483.0, 425.0, 297.0, 219.0, 144.0, 106.0, 68.0, 57.0, 39.0, 22.0, 25.0, 18.0, 12.0, 11.0, 4.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2265625, -1.1948623657226562, -1.1631622314453125, -1.1314620971679688, -1.099761962890625, -1.0680618286132812, -1.0363616943359375, -1.0046615600585938, -0.97296142578125, -0.9412612915039062, -0.9095611572265625, -0.8778610229492188, -0.846160888671875, -0.8144607543945312, -0.7827606201171875, -0.7510604858398438, -0.7193603515625, -0.6876602172851562, -0.6559600830078125, -0.6242599487304688, -0.592559814453125, -0.5608596801757812, -0.5291595458984375, -0.49745941162109375, -0.46575927734375, -0.43405914306640625, -0.4023590087890625, -0.37065887451171875, -0.338958740234375, -0.30725860595703125, -0.2755584716796875, -0.24385833740234375, -0.212158203125, -0.18045806884765625, -0.1487579345703125, -0.11705780029296875, -0.085357666015625, -0.05365753173828125, -0.0219573974609375, 0.00974273681640625, 0.04144287109375, 0.07314300537109375, 0.1048431396484375, 0.13654327392578125, 0.168243408203125, 0.19994354248046875, 0.2316436767578125, 0.26334381103515625, 0.2950439453125, 0.32674407958984375, 0.3584442138671875, 0.39014434814453125, 0.421844482421875, 0.45354461669921875, 0.4852447509765625, 0.5169448852539062, 0.54864501953125, 0.5803451538085938, 0.6120452880859375, 0.6437454223632812, 0.675445556640625, 0.7071456909179688, 0.7388458251953125, 0.7705459594726562, 0.80224609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 10.0, 11.0, 32.0, 32.0, 41.0, 50.0, 66.0, 89.0, 99.0, 93.0, 107.0, 92.0, 73.0, 60.0, 44.0, 29.0, 27.0, 19.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.473639965057373, -5.331472873687744, -5.189305305480957, -5.047138214111328, -4.904971122741699, -4.76280403137207, -4.620636940002441, -4.478469371795654, -4.336302280426025, -4.1941351890563965, -4.051967620849609, -3.9098005294799805, -3.7676334381103516, -3.6254663467407227, -3.4832990169525146, -3.3411316871643066, -3.1989645957946777, -3.056797504425049, -2.914630174636841, -2.772462844848633, -2.630295753479004, -2.488128662109375, -2.345961332321167, -2.203794002532959, -2.06162691116333, -1.9194597005844116, -1.7772924900054932, -1.6351252794265747, -1.4929580688476562, -1.3507908582687378, -1.2086236476898193, -1.0664564371109009, -0.9242887496948242, -0.7821215391159058, -0.6399543285369873, -0.49778711795806885, -0.3556199073791504, -0.21345269680023193, -0.07128548622131348, 0.07088172435760498, 0.21304893493652344, 0.3552161455154419, 0.49738335609436035, 0.6395505666732788, 0.7817177772521973, 0.9238849878311157, 1.0660521984100342, 1.2082194089889526, 1.350386619567871, 1.4925538301467896, 1.634721040725708, 1.7768882513046265, 1.919055461883545, 2.061222553253174, 2.203389883041382, 2.34555721282959, 2.4877243041992188, 2.6298913955688477, 2.7720587253570557, 2.9142260551452637, 3.0563931465148926, 3.1985602378845215, 3.3407275676727295, 3.4828948974609375, 3.6250619888305664]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 12.0, 19.0, 16.0, 25.0, 15.0, 29.0, 27.0, 32.0, 38.0, 47.0, 41.0, 39.0, 39.0, 45.0, 42.0, 47.0, 64.0, 48.0, 51.0, 37.0, 31.0, 30.0, 35.0, 34.0, 34.0, 20.0, 12.0, 14.0, 14.0, 8.0, 9.0, 6.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9903507232666016, -1.9063572883605957, -1.8223639726638794, -1.7383705377578735, -1.6543771028518677, -1.5703837871551514, -1.4863903522491455, -1.4023969173431396, -1.3184034824371338, -1.234410047531128, -1.1504167318344116, -1.0664232969284058, -0.9824298620223999, -0.8984364867210388, -0.8144431114196777, -0.7304496765136719, -0.6464563608169556, -0.5624629855155945, -0.4784695506095886, -0.39447617530822754, -0.31048277020454407, -0.2264893651008606, -0.1424959897994995, -0.05850255489349365, 0.02549082040786743, 0.1094842180609703, 0.19347761571407318, 0.27747100591659546, 0.36146441102027893, 0.4454578161239624, 0.5294511914253235, 0.6134446263313293, 0.6974380016326904, 0.7814313769340515, 0.8654248118400574, 0.9494181871414185, 1.0334116220474243, 1.1174049377441406, 1.2013983726501465, 1.2853918075561523, 1.3693852424621582, 1.453378677368164, 1.5373719930648804, 1.6213654279708862, 1.705358862876892, 1.7893521785736084, 1.8733456134796143, 1.9573390483856201, 2.041332244873047, 2.1253256797790527, 2.2093191146850586, 2.2933125495910645, 2.377305746078491, 2.461299180984497, 2.545292615890503, 2.629286050796509, 2.7132794857025146, 2.7972729206085205, 2.8812663555145264, 2.965259552001953, 3.049252986907959, 3.133246421813965, 3.2172398567199707, 3.3012332916259766, 3.3852267265319824]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 14.0, 27.0, 33.0, 52.0, 96.0, 138.0, 268.0, 379.0, 919.0, 1972.0, 4871.0, 13039.0, 40157.0, 129187.0, 337371.0, 333228.0, 126188.0, 39141.0, 12931.0, 4717.0, 1906.0, 886.0, 414.0, 240.0, 132.0, 78.0, 56.0, 28.0, 32.0, 19.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5287551879882812, -0.5111236572265625, -0.49349212646484375, -0.475860595703125, -0.45822906494140625, -0.4405975341796875, -0.42296600341796875, -0.40533447265625, -0.38770294189453125, -0.3700714111328125, -0.35243988037109375, -0.334808349609375, -0.31717681884765625, -0.2995452880859375, -0.28191375732421875, -0.2642822265625, -0.24665069580078125, -0.2290191650390625, -0.21138763427734375, -0.193756103515625, -0.17612457275390625, -0.1584930419921875, -0.14086151123046875, -0.12322998046875, -0.10559844970703125, -0.0879669189453125, -0.07033538818359375, -0.052703857421875, -0.03507232666015625, -0.0174407958984375, 0.00019073486328125, 0.017822265625, 0.03545379638671875, 0.0530853271484375, 0.07071685791015625, 0.088348388671875, 0.10597991943359375, 0.1236114501953125, 0.14124298095703125, 0.15887451171875, 0.17650604248046875, 0.1941375732421875, 0.21176910400390625, 0.229400634765625, 0.24703216552734375, 0.2646636962890625, 0.28229522705078125, 0.2999267578125, 0.31755828857421875, 0.3351898193359375, 0.35282135009765625, 0.370452880859375, 0.38808441162109375, 0.4057159423828125, 0.42334747314453125, 0.44097900390625, 0.45861053466796875, 0.4762420654296875, 0.49387359619140625, 0.511505126953125, 0.5291366577148438, 0.5467681884765625, 0.5643997192382812, 0.58203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 6.0, 5.0, 11.0, 17.0, 18.0, 28.0, 20.0, 36.0, 43.0, 36.0, 42.0, 53.0, 71.0, 80.0, 61.0, 55.0, 48.0, 62.0, 53.0, 47.0, 48.0, 23.0, 36.0, 33.0, 19.0, 11.0, 7.0, 12.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.673248291015625, -1.59649658203125, -1.519744873046875, -1.4429931640625, -1.366241455078125, -1.28948974609375, -1.212738037109375, -1.135986328125, -1.059234619140625, -0.98248291015625, -0.905731201171875, -0.8289794921875, -0.752227783203125, -0.67547607421875, -0.598724365234375, -0.52197265625, -0.445220947265625, -0.36846923828125, -0.291717529296875, -0.2149658203125, -0.138214111328125, -0.06146240234375, 0.015289306640625, 0.092041015625, 0.168792724609375, 0.24554443359375, 0.322296142578125, 0.3990478515625, 0.475799560546875, 0.55255126953125, 0.629302978515625, 0.7060546875, 0.782806396484375, 0.85955810546875, 0.936309814453125, 1.0130615234375, 1.089813232421875, 1.16656494140625, 1.243316650390625, 1.320068359375, 1.396820068359375, 1.47357177734375, 1.550323486328125, 1.6270751953125, 1.703826904296875, 1.78057861328125, 1.857330322265625, 1.93408203125, 2.010833740234375, 2.08758544921875, 2.164337158203125, 2.2410888671875, 2.317840576171875, 2.39459228515625, 2.471343994140625, 2.548095703125, 2.624847412109375, 2.70159912109375, 2.778350830078125, 2.8551025390625, 2.931854248046875, 3.00860595703125, 3.085357666015625, 3.162109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 3.0, 12.0, 11.0, 14.0, 25.0, 34.0, 50.0, 85.0, 126.0, 196.0, 317.0, 491.0, 708.0, 1145.0, 1761.0, 2914.0, 4619.0, 7538.0, 11819.0, 19030.0, 29740.0, 46383.0, 71340.0, 105166.0, 141018.0, 157844.0, 141102.0, 105637.0, 72048.0, 46719.0, 29707.0, 18887.0, 12044.0, 7547.0, 4504.0, 2871.0, 1812.0, 1188.0, 748.0, 474.0, 315.0, 203.0, 112.0, 82.0, 60.0, 33.0, 29.0, 14.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1788330078125, -0.1727733612060547, -0.16671371459960938, -0.16065406799316406, -0.15459442138671875, -0.14853477478027344, -0.14247512817382812, -0.1364154815673828, -0.1303558349609375, -0.12429618835449219, -0.11823654174804688, -0.11217689514160156, -0.10611724853515625, -0.10005760192871094, -0.09399795532226562, -0.08793830871582031, -0.081878662109375, -0.07581901550292969, -0.06975936889648438, -0.06369972229003906, -0.05764007568359375, -0.05158042907714844, -0.045520782470703125, -0.03946113586425781, -0.0334014892578125, -0.027341842651367188, -0.021282196044921875, -0.015222549438476562, -0.00916290283203125, -0.0031032562255859375, 0.002956390380859375, 0.009016036987304688, 0.01507568359375, 0.021135330200195312, 0.027194976806640625, 0.03325462341308594, 0.03931427001953125, 0.04537391662597656, 0.051433563232421875, 0.05749320983886719, 0.0635528564453125, 0.06961250305175781, 0.07567214965820312, 0.08173179626464844, 0.08779144287109375, 0.09385108947753906, 0.09991073608398438, 0.10597038269042969, 0.112030029296875, 0.11808967590332031, 0.12414932250976562, 0.13020896911621094, 0.13626861572265625, 0.14232826232910156, 0.14838790893554688, 0.1544475555419922, 0.1605072021484375, 0.1665668487548828, 0.17262649536132812, 0.17868614196777344, 0.18474578857421875, 0.19080543518066406, 0.19686508178710938, 0.2029247283935547, 0.208984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 11.0, 16.0, 12.0, 12.0, 20.0, 29.0, 24.0, 20.0, 28.0, 27.0, 30.0, 46.0, 51.0, 44.0, 52.0, 61.0, 60.0, 43.0, 41.0, 40.0, 47.0, 38.0, 27.0, 25.0, 26.0, 22.0, 23.0, 18.0, 17.0, 12.0, 17.0, 15.0, 12.0, 10.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.164581298828125, -3.04986572265625, -2.935150146484375, -2.8204345703125, -2.705718994140625, -2.59100341796875, -2.476287841796875, -2.361572265625, -2.246856689453125, -2.13214111328125, -2.017425537109375, -1.9027099609375, -1.787994384765625, -1.67327880859375, -1.558563232421875, -1.44384765625, -1.329132080078125, -1.21441650390625, -1.099700927734375, -0.9849853515625, -0.870269775390625, -0.75555419921875, -0.640838623046875, -0.526123046875, -0.411407470703125, -0.29669189453125, -0.181976318359375, -0.0672607421875, 0.047454833984375, 0.16217041015625, 0.276885986328125, 0.3916015625, 0.506317138671875, 0.62103271484375, 0.735748291015625, 0.8504638671875, 0.965179443359375, 1.07989501953125, 1.194610595703125, 1.309326171875, 1.424041748046875, 1.53875732421875, 1.653472900390625, 1.7681884765625, 1.882904052734375, 1.99761962890625, 2.112335205078125, 2.22705078125, 2.341766357421875, 2.45648193359375, 2.571197509765625, 2.6859130859375, 2.800628662109375, 2.91534423828125, 3.030059814453125, 3.144775390625, 3.259490966796875, 3.37420654296875, 3.488922119140625, 3.6036376953125, 3.718353271484375, 3.83306884765625, 3.947784423828125, 4.0625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 14.0, 12.0, 18.0, 29.0, 37.0, 57.0, 86.0, 113.0, 210.0, 304.0, 524.0, 1009.0, 2084.0, 5286.0, 17541.0, 70156.0, 275778.0, 444150.0, 171466.0, 41214.0, 11092.0, 3845.0, 1617.0, 773.0, 390.0, 243.0, 156.0, 103.0, 66.0, 46.0, 34.0, 21.0, 21.0, 12.0, 5.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048797607421875, -0.04694318771362305, -0.045088768005371094, -0.04323434829711914, -0.04137992858886719, -0.039525508880615234, -0.03767108917236328, -0.03581666946411133, -0.033962249755859375, -0.03210783004760742, -0.03025341033935547, -0.028398990631103516, -0.026544570922851562, -0.02469015121459961, -0.022835731506347656, -0.020981311798095703, -0.01912689208984375, -0.017272472381591797, -0.015418052673339844, -0.01356363296508789, -0.011709213256835938, -0.009854793548583984, -0.008000373840332031, -0.006145954132080078, -0.004291534423828125, -0.002437114715576172, -0.0005826950073242188, 0.0012717247009277344, 0.0031261444091796875, 0.004980564117431641, 0.006834983825683594, 0.008689403533935547, 0.0105438232421875, 0.012398242950439453, 0.014252662658691406, 0.01610708236694336, 0.017961502075195312, 0.019815921783447266, 0.02167034149169922, 0.023524761199951172, 0.025379180908203125, 0.027233600616455078, 0.02908802032470703, 0.030942440032958984, 0.03279685974121094, 0.03465127944946289, 0.036505699157714844, 0.0383601188659668, 0.04021453857421875, 0.0420689582824707, 0.043923377990722656, 0.04577779769897461, 0.04763221740722656, 0.049486637115478516, 0.05134105682373047, 0.05319547653198242, 0.055049896240234375, 0.05690431594848633, 0.05875873565673828, 0.060613155364990234, 0.06246757507324219, 0.06432199478149414, 0.0661764144897461, 0.06803083419799805, 0.06988525390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 12.0, 7.0, 29.0, 46.0, 68.0, 115.0, 126.0, 138.0, 150.0, 125.0, 77.0, 34.0, 32.0, 18.0, 13.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8995018005371094e-05, -4.674401134252548e-05, -4.449300467967987e-05, -4.224199801683426e-05, -3.999099135398865e-05, -3.7739984691143036e-05, -3.5488978028297424e-05, -3.323797136545181e-05, -3.09869647026062e-05, -2.873595803976059e-05, -2.6484951376914978e-05, -2.4233944714069366e-05, -2.1982938051223755e-05, -1.9731931388378143e-05, -1.7480924725532532e-05, -1.522991806268692e-05, -1.2978911399841309e-05, -1.0727904736995697e-05, -8.476898074150085e-06, -6.225891411304474e-06, -3.974884748458862e-06, -1.7238780856132507e-06, 5.271285772323608e-07, 2.7781352400779724e-06, 5.029141902923584e-06, 7.2801485657691956e-06, 9.531155228614807e-06, 1.1782161891460419e-05, 1.403316855430603e-05, 1.6284175217151642e-05, 1.8535181879997253e-05, 2.0786188542842865e-05, 2.3037195205688477e-05, 2.5288201868534088e-05, 2.75392085313797e-05, 2.979021519422531e-05, 3.204122185707092e-05, 3.4292228519916534e-05, 3.6543235182762146e-05, 3.879424184560776e-05, 4.104524850845337e-05, 4.329625517129898e-05, 4.554726183414459e-05, 4.7798268496990204e-05, 5.0049275159835815e-05, 5.230028182268143e-05, 5.455128848552704e-05, 5.680229514837265e-05, 5.905330181121826e-05, 6.130430847406387e-05, 6.355531513690948e-05, 6.58063217997551e-05, 6.805732846260071e-05, 7.030833512544632e-05, 7.255934178829193e-05, 7.481034845113754e-05, 7.706135511398315e-05, 7.931236177682877e-05, 8.156336843967438e-05, 8.381437510251999e-05, 8.60653817653656e-05, 8.831638842821121e-05, 9.056739509105682e-05, 9.281840175390244e-05, 9.506940841674805e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 4.0, 17.0, 22.0, 30.0, 41.0, 42.0, 68.0, 105.0, 174.0, 314.0, 556.0, 1181.0, 2614.0, 6800.0, 18623.0, 54137.0, 159157.0, 345160.0, 287296.0, 112392.0, 37786.0, 13044.0, 4932.0, 2005.0, 917.0, 437.0, 250.0, 133.0, 97.0, 49.0, 39.0, 33.0, 18.0, 18.0, 12.0, 5.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.045928955078125, -0.0445713996887207, -0.043213844299316406, -0.04185628890991211, -0.04049873352050781, -0.039141178131103516, -0.03778362274169922, -0.03642606735229492, -0.035068511962890625, -0.03371095657348633, -0.03235340118408203, -0.030995845794677734, -0.029638290405273438, -0.02828073501586914, -0.026923179626464844, -0.025565624237060547, -0.02420806884765625, -0.022850513458251953, -0.021492958068847656, -0.02013540267944336, -0.018777847290039062, -0.017420291900634766, -0.01606273651123047, -0.014705181121826172, -0.013347625732421875, -0.011990070343017578, -0.010632514953613281, -0.009274959564208984, -0.007917404174804688, -0.006559848785400391, -0.005202293395996094, -0.003844738006591797, -0.0024871826171875, -0.0011296272277832031, 0.00022792816162109375, 0.0015854835510253906, 0.0029430389404296875, 0.004300594329833984, 0.005658149719238281, 0.007015705108642578, 0.008373260498046875, 0.009730815887451172, 0.011088371276855469, 0.012445926666259766, 0.013803482055664062, 0.01516103744506836, 0.016518592834472656, 0.017876148223876953, 0.01923370361328125, 0.020591259002685547, 0.021948814392089844, 0.02330636978149414, 0.024663925170898438, 0.026021480560302734, 0.02737903594970703, 0.028736591339111328, 0.030094146728515625, 0.03145170211791992, 0.03280925750732422, 0.034166812896728516, 0.03552436828613281, 0.03688192367553711, 0.038239479064941406, 0.0395970344543457, 0.04095458984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 6.0, 4.0, 12.0, 12.0, 19.0, 26.0, 26.0, 26.0, 36.0, 43.0, 55.0, 59.0, 56.0, 65.0, 70.0, 70.0, 60.0, 63.0, 50.0, 43.0, 42.0, 26.0, 25.0, 12.0, 16.0, 10.0, 10.0, 13.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-0.0199432373046875, -0.01945960521697998, -0.01897597312927246, -0.01849234104156494, -0.018008708953857422, -0.017525076866149902, -0.017041444778442383, -0.016557812690734863, -0.016074180603027344, -0.015590548515319824, -0.015106916427612305, -0.014623284339904785, -0.014139652252197266, -0.013656020164489746, -0.013172388076782227, -0.012688755989074707, -0.012205123901367188, -0.011721491813659668, -0.011237859725952148, -0.010754227638244629, -0.01027059555053711, -0.00978696346282959, -0.00930333137512207, -0.00881969928741455, -0.008336067199707031, -0.007852435111999512, -0.007368803024291992, -0.006885170936584473, -0.006401538848876953, -0.005917906761169434, -0.005434274673461914, -0.0049506425857543945, -0.004467010498046875, -0.0039833784103393555, -0.003499746322631836, -0.0030161142349243164, -0.002532482147216797, -0.0020488500595092773, -0.0015652179718017578, -0.0010815858840942383, -0.0005979537963867188, -0.00011432170867919922, 0.0003693103790283203, 0.0008529424667358398, 0.0013365745544433594, 0.001820206642150879, 0.0023038387298583984, 0.002787470817565918, 0.0032711029052734375, 0.003754734992980957, 0.0042383670806884766, 0.004721999168395996, 0.005205631256103516, 0.005689263343811035, 0.006172895431518555, 0.006656527519226074, 0.007140159606933594, 0.007623791694641113, 0.008107423782348633, 0.008591055870056152, 0.009074687957763672, 0.009558320045471191, 0.010041952133178711, 0.01052558422088623, 0.01100921630859375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 41.0, 97.0, 197.0, 254.0, 221.0, 121.0, 44.0, 15.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.412555694580078, -9.185964584350586, -8.95937442779541, -8.732783317565918, -8.506192207336426, -8.279601097106934, -8.053010940551758, -7.826419830322266, -7.599828720092773, -7.3732380867004395, -7.146646976470947, -6.920056343078613, -6.693465232849121, -6.466874599456787, -6.240283966064453, -6.013692855834961, -5.787102222442627, -5.560511589050293, -5.333920478820801, -5.107329845428467, -4.880738735198975, -4.654148101806641, -4.427556991577148, -4.2009663581848145, -3.9743754863739014, -3.7477846145629883, -3.521193742752075, -3.294602870941162, -3.068012237548828, -2.841421127319336, -2.614830493927002, -2.388239622116089, -2.161648750305176, -1.9350578784942627, -1.7084670066833496, -1.481876254081726, -1.255285382270813, -1.0286945104599, -0.8021037578582764, -0.5755128860473633, -0.3489220142364502, -0.1223311722278595, 0.1042596697807312, 0.3308504819869995, 0.5574413537979126, 0.7840322256088257, 1.0106229782104492, 1.2372138500213623, 1.4638047218322754, 1.6903955936431885, 1.9169864654541016, 2.1435770988464355, 2.3701682090759277, 2.5967588424682617, 2.823349714279175, 3.049940586090088, 3.276531457901001, 3.503122329711914, 3.729713201522827, 3.9563040733337402, 4.182894706726074, 4.409485816955566, 4.6360764503479, 4.862667083740234, 5.089258193969727]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 11.0, 20.0, 24.0, 22.0, 34.0, 30.0, 38.0, 52.0, 50.0, 53.0, 48.0, 47.0, 59.0, 72.0, 53.0, 59.0, 45.0, 40.0, 38.0, 39.0, 31.0, 24.0, 22.0, 14.0, 13.0, 10.0, 7.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5494000911712646, -1.480488896369934, -1.4115777015686035, -1.342666506767273, -1.2737553119659424, -1.2048442363739014, -1.1359330415725708, -1.0670218467712402, -0.9981106519699097, -0.9291994571685791, -0.8602882623672485, -0.7913771271705627, -0.7224659323692322, -0.6535547375679016, -0.5846436023712158, -0.5157324075698853, -0.4468212127685547, -0.3779100179672241, -0.30899885296821594, -0.24008767306804657, -0.1711764931678772, -0.10226529836654663, -0.03335413336753845, 0.03555703163146973, 0.10446822643280029, 0.17337940633296967, 0.24229058623313904, 0.3112017512321472, 0.3801129460334778, 0.44902414083480835, 0.5179352760314941, 0.5868464708328247, 0.6557574272155762, 0.7246686220169067, 0.7935798168182373, 0.8624909520149231, 0.9314021468162537, 1.0003132820129395, 1.06922447681427, 1.1381356716156006, 1.2070468664169312, 1.2759580612182617, 1.3448692560195923, 1.4137804508209229, 1.4826915264129639, 1.551602840423584, 1.620513916015625, 1.6894251108169556, 1.7583363056182861, 1.8272475004196167, 1.8961586952209473, 1.9650698900222778, 2.0339810848236084, 2.1028921604156494, 2.1718034744262695, 2.2407145500183105, 2.3096256256103516, 2.3785367012023926, 2.4474480152130127, 2.5163590908050537, 2.585270404815674, 2.654181480407715, 2.723092794418335, 2.792003870010376, 2.860915184020996]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 14.0, 19.0, 43.0, 64.0, 107.0, 203.0, 438.0, 901.0, 2148.0, 4915.0, 13911.0, 45578.0, 179110.0, 519140.0, 205393.0, 51631.0, 15369.0, 5471.0, 2137.0, 974.0, 444.0, 219.0, 127.0, 74.0, 36.0, 14.0, 19.0, 13.0, 10.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.311981201171875, -2.24505615234375, -2.178131103515625, -2.1112060546875, -2.044281005859375, -1.97735595703125, -1.910430908203125, -1.843505859375, -1.776580810546875, -1.70965576171875, -1.642730712890625, -1.5758056640625, -1.508880615234375, -1.44195556640625, -1.375030517578125, -1.30810546875, -1.241180419921875, -1.17425537109375, -1.107330322265625, -1.0404052734375, -0.973480224609375, -0.90655517578125, -0.839630126953125, -0.772705078125, -0.705780029296875, -0.63885498046875, -0.571929931640625, -0.5050048828125, -0.438079833984375, -0.37115478515625, -0.304229736328125, -0.2373046875, -0.170379638671875, -0.10345458984375, -0.036529541015625, 0.0303955078125, 0.097320556640625, 0.16424560546875, 0.231170654296875, 0.298095703125, 0.365020751953125, 0.43194580078125, 0.498870849609375, 0.5657958984375, 0.632720947265625, 0.69964599609375, 0.766571044921875, 0.83349609375, 0.900421142578125, 0.96734619140625, 1.034271240234375, 1.1011962890625, 1.168121337890625, 1.23504638671875, 1.301971435546875, 1.368896484375, 1.435821533203125, 1.50274658203125, 1.569671630859375, 1.6365966796875, 1.703521728515625, 1.77044677734375, 1.837371826171875, 1.904296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 7.0, 5.0, 6.0, 14.0, 16.0, 12.0, 23.0, 22.0, 41.0, 30.0, 49.0, 50.0, 52.0, 48.0, 52.0, 50.0, 66.0, 69.0, 48.0, 52.0, 39.0, 42.0, 42.0, 21.0, 25.0, 18.0, 25.0, 13.0, 17.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.389129638671875, -3.26458740234375, -3.140045166015625, -3.0155029296875, -2.890960693359375, -2.76641845703125, -2.641876220703125, -2.517333984375, -2.392791748046875, -2.26824951171875, -2.143707275390625, -2.0191650390625, -1.894622802734375, -1.77008056640625, -1.645538330078125, -1.52099609375, -1.396453857421875, -1.27191162109375, -1.147369384765625, -1.0228271484375, -0.898284912109375, -0.77374267578125, -0.649200439453125, -0.524658203125, -0.400115966796875, -0.27557373046875, -0.151031494140625, -0.0264892578125, 0.098052978515625, 0.22259521484375, 0.347137451171875, 0.4716796875, 0.596221923828125, 0.72076416015625, 0.845306396484375, 0.9698486328125, 1.094390869140625, 1.21893310546875, 1.343475341796875, 1.468017578125, 1.592559814453125, 1.71710205078125, 1.841644287109375, 1.9661865234375, 2.090728759765625, 2.21527099609375, 2.339813232421875, 2.46435546875, 2.588897705078125, 2.71343994140625, 2.837982177734375, 2.9625244140625, 3.087066650390625, 3.21160888671875, 3.336151123046875, 3.460693359375, 3.585235595703125, 3.70977783203125, 3.834320068359375, 3.9588623046875, 4.083404541015625, 4.20794677734375, 4.332489013671875, 4.45703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 17.0, 21.0, 32.0, 39.0, 84.0, 108.0, 155.0, 237.0, 555.0, 3187.0, 217870.0, 816914.0, 7771.0, 798.0, 253.0, 190.0, 116.0, 72.0, 43.0, 34.0, 22.0, 9.0, 8.0, 8.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3125, -10.06781005859375, -9.8231201171875, -9.57843017578125, -9.333740234375, -9.08905029296875, -8.8443603515625, -8.59967041015625, -8.35498046875, -8.11029052734375, -7.8656005859375, -7.62091064453125, -7.376220703125, -7.13153076171875, -6.8868408203125, -6.64215087890625, -6.3974609375, -6.15277099609375, -5.9080810546875, -5.66339111328125, -5.418701171875, -5.17401123046875, -4.9293212890625, -4.68463134765625, -4.43994140625, -4.19525146484375, -3.9505615234375, -3.70587158203125, -3.461181640625, -3.21649169921875, -2.9718017578125, -2.72711181640625, -2.482421875, -2.23773193359375, -1.9930419921875, -1.74835205078125, -1.503662109375, -1.25897216796875, -1.0142822265625, -0.76959228515625, -0.52490234375, -0.28021240234375, -0.0355224609375, 0.20916748046875, 0.453857421875, 0.69854736328125, 0.9432373046875, 1.18792724609375, 1.4326171875, 1.67730712890625, 1.9219970703125, 2.16668701171875, 2.411376953125, 2.65606689453125, 2.9007568359375, 3.14544677734375, 3.39013671875, 3.63482666015625, 3.8795166015625, 4.12420654296875, 4.368896484375, 4.61358642578125, 4.8582763671875, 5.10296630859375, 5.34765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 12.0, 5.0, 6.0, 8.0, 7.0, 16.0, 12.0, 29.0, 29.0, 19.0, 24.0, 40.0, 41.0, 49.0, 44.0, 37.0, 56.0, 66.0, 48.0, 42.0, 50.0, 57.0, 37.0, 37.0, 44.0, 29.0, 30.0, 29.0, 26.0, 20.0, 13.0, 10.0, 13.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01171875, -4.86651611328125, -4.7213134765625, -4.57611083984375, -4.430908203125, -4.28570556640625, -4.1405029296875, -3.99530029296875, -3.85009765625, -3.70489501953125, -3.5596923828125, -3.41448974609375, -3.269287109375, -3.12408447265625, -2.9788818359375, -2.83367919921875, -2.6884765625, -2.54327392578125, -2.3980712890625, -2.25286865234375, -2.107666015625, -1.96246337890625, -1.8172607421875, -1.67205810546875, -1.52685546875, -1.38165283203125, -1.2364501953125, -1.09124755859375, -0.946044921875, -0.80084228515625, -0.6556396484375, -0.51043701171875, -0.365234375, -0.22003173828125, -0.0748291015625, 0.07037353515625, 0.215576171875, 0.36077880859375, 0.5059814453125, 0.65118408203125, 0.79638671875, 0.94158935546875, 1.0867919921875, 1.23199462890625, 1.377197265625, 1.52239990234375, 1.6676025390625, 1.81280517578125, 1.9580078125, 2.10321044921875, 2.2484130859375, 2.39361572265625, 2.538818359375, 2.68402099609375, 2.8292236328125, 2.97442626953125, 3.11962890625, 3.26483154296875, 3.4100341796875, 3.55523681640625, 3.700439453125, 3.84564208984375, 3.9908447265625, 4.13604736328125, 4.28125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 9.0, 9.0, 18.0, 31.0, 45.0, 80.0, 187.0, 397.0, 1134.0, 3920.0, 23560.0, 897257.0, 112314.0, 6647.0, 1795.0, 585.0, 254.0, 101.0, 58.0, 36.0, 24.0, 14.0, 11.0, 4.0, 8.0, 5.0, 4.0, 2.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.537109375, -2.459503173828125, -2.38189697265625, -2.304290771484375, -2.2266845703125, -2.149078369140625, -2.07147216796875, -1.993865966796875, -1.916259765625, -1.838653564453125, -1.76104736328125, -1.683441162109375, -1.6058349609375, -1.528228759765625, -1.45062255859375, -1.373016357421875, -1.29541015625, -1.217803955078125, -1.14019775390625, -1.062591552734375, -0.9849853515625, -0.907379150390625, -0.82977294921875, -0.752166748046875, -0.674560546875, -0.596954345703125, -0.51934814453125, -0.441741943359375, -0.3641357421875, -0.286529541015625, -0.20892333984375, -0.131317138671875, -0.0537109375, 0.023895263671875, 0.10150146484375, 0.179107666015625, 0.2567138671875, 0.334320068359375, 0.41192626953125, 0.489532470703125, 0.567138671875, 0.644744873046875, 0.72235107421875, 0.799957275390625, 0.8775634765625, 0.955169677734375, 1.03277587890625, 1.110382080078125, 1.18798828125, 1.265594482421875, 1.34320068359375, 1.420806884765625, 1.4984130859375, 1.576019287109375, 1.65362548828125, 1.731231689453125, 1.808837890625, 1.886444091796875, 1.96405029296875, 2.041656494140625, 2.1192626953125, 2.196868896484375, 2.27447509765625, 2.352081298828125, 2.4296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 26.0, 39.0, 73.0, 171.0, 334.0, 177.0, 95.0, 45.0, 17.0, 10.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0006976127624511719, -0.000683516263961792, -0.0006694197654724121, -0.0006553232669830322, -0.0006412267684936523, -0.0006271302700042725, -0.0006130337715148926, -0.0005989372730255127, -0.0005848407745361328, -0.0005707442760467529, -0.000556647777557373, -0.0005425512790679932, -0.0005284547805786133, -0.0005143582820892334, -0.0005002617835998535, -0.00048616528511047363, -0.00047206878662109375, -0.00045797228813171387, -0.000443875789642334, -0.0004297792911529541, -0.0004156827926635742, -0.00040158629417419434, -0.00038748979568481445, -0.00037339329719543457, -0.0003592967987060547, -0.0003452003002166748, -0.0003311038017272949, -0.00031700730323791504, -0.00030291080474853516, -0.0002888143062591553, -0.0002747178077697754, -0.0002606213092803955, -0.0002465248107910156, -0.00023242831230163574, -0.00021833181381225586, -0.00020423531532287598, -0.0001901388168334961, -0.0001760423183441162, -0.00016194581985473633, -0.00014784932136535645, -0.00013375282287597656, -0.00011965632438659668, -0.0001055598258972168, -9.146332740783691e-05, -7.736682891845703e-05, -6.327033042907715e-05, -4.9173831939697266e-05, -3.507733345031738e-05, -2.09808349609375e-05, -6.884336471557617e-06, 7.212162017822266e-06, 2.130866050720215e-05, 3.540515899658203e-05, 4.9501657485961914e-05, 6.35981559753418e-05, 7.769465446472168e-05, 9.179115295410156e-05, 0.00010588765144348145, 0.00011998414993286133, 0.0001340806484222412, 0.0001481771469116211, 0.00016227364540100098, 0.00017637014389038086, 0.00019046664237976074, 0.00020456314086914062]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 5.0, 12.0, 29.0, 60.0, 94.0, 166.0, 402.0, 1000.0, 4329.0, 64989.0, 941860.0, 30881.0, 3203.0, 779.0, 336.0, 162.0, 92.0, 41.0, 19.0, 17.0, 12.0, 10.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.320343017578125, -2.23248291015625, -2.144622802734375, -2.0567626953125, -1.968902587890625, -1.88104248046875, -1.793182373046875, -1.705322265625, -1.617462158203125, -1.52960205078125, -1.441741943359375, -1.3538818359375, -1.266021728515625, -1.17816162109375, -1.090301513671875, -1.00244140625, -0.914581298828125, -0.82672119140625, -0.738861083984375, -0.6510009765625, -0.563140869140625, -0.47528076171875, -0.387420654296875, -0.299560546875, -0.211700439453125, -0.12384033203125, -0.035980224609375, 0.0518798828125, 0.139739990234375, 0.22760009765625, 0.315460205078125, 0.4033203125, 0.491180419921875, 0.57904052734375, 0.666900634765625, 0.7547607421875, 0.842620849609375, 0.93048095703125, 1.018341064453125, 1.106201171875, 1.194061279296875, 1.28192138671875, 1.369781494140625, 1.4576416015625, 1.545501708984375, 1.63336181640625, 1.721221923828125, 1.80908203125, 1.896942138671875, 1.98480224609375, 2.072662353515625, 2.1605224609375, 2.248382568359375, 2.33624267578125, 2.424102783203125, 2.511962890625, 2.599822998046875, 2.68768310546875, 2.775543212890625, 2.8634033203125, 2.951263427734375, 3.03912353515625, 3.126983642578125, 3.21484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 2.0, 12.0, 10.0, 10.0, 15.0, 19.0, 28.0, 46.0, 48.0, 76.0, 87.0, 117.0, 108.0, 74.0, 69.0, 62.0, 48.0, 39.0, 23.0, 21.0, 11.0, 15.0, 7.0, 6.0, 4.0, 0.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.37353515625, -0.3606605529785156, -0.34778594970703125, -0.3349113464355469, -0.3220367431640625, -0.3091621398925781, -0.29628753662109375, -0.2834129333496094, -0.270538330078125, -0.2576637268066406, -0.24478912353515625, -0.23191452026367188, -0.2190399169921875, -0.20616531372070312, -0.19329071044921875, -0.18041610717773438, -0.16754150390625, -0.15466690063476562, -0.14179229736328125, -0.12891769409179688, -0.1160430908203125, -0.10316848754882812, -0.09029388427734375, -0.07741928100585938, -0.064544677734375, -0.051670074462890625, -0.03879547119140625, -0.025920867919921875, -0.0130462646484375, -0.000171661376953125, 0.01270294189453125, 0.025577545166015625, 0.0384521484375, 0.051326751708984375, 0.06420135498046875, 0.07707595825195312, 0.0899505615234375, 0.10282516479492188, 0.11569976806640625, 0.12857437133789062, 0.141448974609375, 0.15432357788085938, 0.16719818115234375, 0.18007278442382812, 0.1929473876953125, 0.20582199096679688, 0.21869659423828125, 0.23157119750976562, 0.24444580078125, 0.2573204040527344, 0.27019500732421875, 0.2830696105957031, 0.2959442138671875, 0.3088188171386719, 0.32169342041015625, 0.3345680236816406, 0.347442626953125, 0.3603172302246094, 0.37319183349609375, 0.3860664367675781, 0.3989410400390625, 0.4118156433105469, 0.42469024658203125, 0.4375648498535156, 0.450439453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 11.0, 13.0, 46.0, 69.0, 111.0, 161.0, 150.0, 176.0, 114.0, 66.0, 51.0, 13.0, 11.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.608284950256348, -8.32614803314209, -8.044010162353516, -7.7618727684021, -7.479735374450684, -7.197598457336426, -6.91546106338501, -6.633323669433594, -6.351186275482178, -6.069048881530762, -5.786911487579346, -5.50477409362793, -5.222637176513672, -4.940499305725098, -4.65836238861084, -4.376224994659424, -4.094087600708008, -3.811950206756592, -3.529812812805176, -3.247675657272339, -2.965538263320923, -2.683400869369507, -2.40126371383667, -2.119126319885254, -1.836988925933838, -1.5548515319824219, -1.2727142572402954, -0.9905769228935242, -0.7084395885467529, -0.4263021945953369, -0.14416491985321045, 0.13797235488891602, 0.4201087951660156, 0.7022461295127869, 0.9843834638595581, 1.2665207386016846, 1.5486581325531006, 1.8307955265045166, 2.1129326820373535, 2.3950700759887695, 2.6772074699401855, 2.9593448638916016, 3.2414822578430176, 3.5236194133758545, 3.8057568073272705, 4.087894439697266, 4.370031356811523, 4.6521687507629395, 4.9343061447143555, 5.2164435386657715, 5.4985809326171875, 5.7807183265686035, 6.0628557205200195, 6.344992637634277, 6.627130031585693, 6.909267425537109, 7.191404819488525, 7.473542213439941, 7.755679607391357, 8.037817001342773, 8.319953918457031, 8.602091789245605, 8.884228706359863, 9.166366577148438, 9.448503494262695]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 7.0, 13.0, 16.0, 11.0, 18.0, 16.0, 20.0, 30.0, 29.0, 28.0, 28.0, 26.0, 38.0, 44.0, 44.0, 37.0, 32.0, 46.0, 32.0, 46.0, 43.0, 33.0, 46.0, 38.0, 43.0, 34.0, 30.0, 23.0, 28.0, 16.0, 12.0, 21.0, 10.0, 13.0, 10.0, 6.0, 6.0, 4.0, 4.0, 8.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.823061943054199, -5.629883289337158, -5.436705112457275, -5.243526458740234, -5.050347805023193, -4.857169151306152, -4.6639909744262695, -4.4708123207092285, -4.2776336669921875, -4.0844550132751465, -3.8912765979766846, -3.6980981826782227, -3.5049195289611816, -3.3117411136627197, -3.118562698364258, -2.925384044647217, -2.732205629348755, -2.539027214050293, -2.345848560333252, -2.15267014503479, -1.959491491317749, -1.766313076019287, -1.5731345415115356, -1.3799560070037842, -1.1867774724960327, -0.9935989379882812, -0.8004204034805298, -0.6072419285774231, -0.41406339406967163, -0.22088485956192017, -0.027706384658813477, 0.165472149848938, 0.35865068435668945, 0.5518292188644409, 0.7450077533721924, 0.9381862282752991, 1.1313648223876953, 1.3245432376861572, 1.5177217721939087, 1.7109003067016602, 1.9040788412094116, 2.097257375717163, 2.290435791015625, 2.483614444732666, 2.676792860031128, 2.869971513748169, 3.063149929046631, 3.256328582763672, 3.449506998062134, 3.6426854133605957, 3.8358640670776367, 4.029042720794678, 4.2222208976745605, 4.415399551391602, 4.608578205108643, 4.801756858825684, 4.994935035705566, 5.188113689422607, 5.38129186630249, 5.574470520019531, 5.767649173736572, 5.960827827453613, 6.154006004333496, 6.347184658050537, 6.540363311767578]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 13.0, 21.0, 30.0, 41.0, 67.0, 109.0, 186.0, 267.0, 505.0, 950.0, 2857.0, 25749.0, 1092606.0, 2979991.0, 83981.0, 4663.0, 1034.0, 437.0, 252.0, 165.0, 113.0, 73.0, 47.0, 33.0, 22.0, 23.0, 15.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.98046875, -6.7762451171875, -6.572021484375, -6.3677978515625, -6.16357421875, -5.9593505859375, -5.755126953125, -5.5509033203125, -5.3466796875, -5.1424560546875, -4.938232421875, -4.7340087890625, -4.52978515625, -4.3255615234375, -4.121337890625, -3.9171142578125, -3.712890625, -3.5086669921875, -3.304443359375, -3.1002197265625, -2.89599609375, -2.6917724609375, -2.487548828125, -2.2833251953125, -2.0791015625, -1.8748779296875, -1.670654296875, -1.4664306640625, -1.26220703125, -1.0579833984375, -0.853759765625, -0.6495361328125, -0.4453125, -0.2410888671875, -0.036865234375, 0.1673583984375, 0.37158203125, 0.5758056640625, 0.780029296875, 0.9842529296875, 1.1884765625, 1.3927001953125, 1.596923828125, 1.8011474609375, 2.00537109375, 2.2095947265625, 2.413818359375, 2.6180419921875, 2.822265625, 3.0264892578125, 3.230712890625, 3.4349365234375, 3.63916015625, 3.8433837890625, 4.047607421875, 4.2518310546875, 4.4560546875, 4.6602783203125, 4.864501953125, 5.0687255859375, 5.27294921875, 5.4771728515625, 5.681396484375, 5.8856201171875, 6.08984375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 20.0, 19.0, 22.0, 25.0, 41.0, 42.0, 50.0, 58.0, 54.0, 73.0, 74.0, 73.0, 70.0, 69.0, 61.0, 51.0, 49.0, 44.0, 24.0, 17.0, 15.0, 7.0, 8.0, 9.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.8138427734375, -1.717529296875, -1.6212158203125, -1.52490234375, -1.4285888671875, -1.332275390625, -1.2359619140625, -1.1396484375, -1.0433349609375, -0.947021484375, -0.8507080078125, -0.75439453125, -0.6580810546875, -0.561767578125, -0.4654541015625, -0.369140625, -0.2728271484375, -0.176513671875, -0.0802001953125, 0.01611328125, 0.1124267578125, 0.208740234375, 0.3050537109375, 0.4013671875, 0.4976806640625, 0.593994140625, 0.6903076171875, 0.78662109375, 0.8829345703125, 0.979248046875, 1.0755615234375, 1.171875, 1.2681884765625, 1.364501953125, 1.4608154296875, 1.55712890625, 1.6534423828125, 1.749755859375, 1.8460693359375, 1.9423828125, 2.0386962890625, 2.135009765625, 2.2313232421875, 2.32763671875, 2.4239501953125, 2.520263671875, 2.6165771484375, 2.712890625, 2.8092041015625, 2.905517578125, 3.0018310546875, 3.09814453125, 3.1944580078125, 3.290771484375, 3.3870849609375, 3.4833984375, 3.5797119140625, 3.676025390625, 3.7723388671875, 3.86865234375, 3.9649658203125, 4.061279296875, 4.1575927734375, 4.25390625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 9.0, 17.0, 10.0, 26.0, 42.0, 66.0, 104.0, 176.0, 332.0, 636.0, 1563.0, 4192.0, 18862.0, 257975.0, 3484585.0, 392401.0, 24794.0, 5067.0, 1736.0, 798.0, 349.0, 198.0, 116.0, 68.0, 38.0, 35.0, 17.0, 16.0, 15.0, 12.0, 5.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.832916259765625, -2.69512939453125, -2.557342529296875, -2.4195556640625, -2.281768798828125, -2.14398193359375, -2.006195068359375, -1.868408203125, -1.730621337890625, -1.59283447265625, -1.455047607421875, -1.3172607421875, -1.179473876953125, -1.04168701171875, -0.903900146484375, -0.76611328125, -0.628326416015625, -0.49053955078125, -0.352752685546875, -0.2149658203125, -0.077178955078125, 0.06060791015625, 0.198394775390625, 0.336181640625, 0.473968505859375, 0.61175537109375, 0.749542236328125, 0.8873291015625, 1.025115966796875, 1.16290283203125, 1.300689697265625, 1.4384765625, 1.576263427734375, 1.71405029296875, 1.851837158203125, 1.9896240234375, 2.127410888671875, 2.26519775390625, 2.402984619140625, 2.540771484375, 2.678558349609375, 2.81634521484375, 2.954132080078125, 3.0919189453125, 3.229705810546875, 3.36749267578125, 3.505279541015625, 3.64306640625, 3.780853271484375, 3.91864013671875, 4.056427001953125, 4.1942138671875, 4.332000732421875, 4.46978759765625, 4.607574462890625, 4.745361328125, 4.883148193359375, 5.02093505859375, 5.158721923828125, 5.2965087890625, 5.434295654296875, 5.57208251953125, 5.709869384765625, 5.84765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 4.0, 9.0, 16.0, 15.0, 33.0, 41.0, 63.0, 88.0, 122.0, 174.0, 255.0, 353.0, 465.0, 504.0, 504.0, 464.0, 296.0, 203.0, 133.0, 95.0, 63.0, 48.0, 35.0, 20.0, 18.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1699066162109375, -1.139617919921875, -1.1093292236328125, -1.07904052734375, -1.0487518310546875, -1.018463134765625, -0.9881744384765625, -0.9578857421875, -0.9275970458984375, -0.897308349609375, -0.8670196533203125, -0.83673095703125, -0.8064422607421875, -0.776153564453125, -0.7458648681640625, -0.715576171875, -0.6852874755859375, -0.654998779296875, -0.6247100830078125, -0.59442138671875, -0.5641326904296875, -0.533843994140625, -0.5035552978515625, -0.4732666015625, -0.4429779052734375, -0.412689208984375, -0.3824005126953125, -0.35211181640625, -0.3218231201171875, -0.291534423828125, -0.2612457275390625, -0.23095703125, -0.2006683349609375, -0.170379638671875, -0.1400909423828125, -0.10980224609375, -0.0795135498046875, -0.049224853515625, -0.0189361572265625, 0.0113525390625, 0.0416412353515625, 0.071929931640625, 0.1022186279296875, 0.13250732421875, 0.1627960205078125, 0.193084716796875, 0.2233734130859375, 0.253662109375, 0.2839508056640625, 0.314239501953125, 0.3445281982421875, 0.37481689453125, 0.4051055908203125, 0.435394287109375, 0.4656829833984375, 0.4959716796875, 0.5262603759765625, 0.556549072265625, 0.5868377685546875, 0.61712646484375, 0.6474151611328125, 0.677703857421875, 0.7079925537109375, 0.73828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 14.0, 17.0, 30.0, 55.0, 86.0, 135.0, 148.0, 125.0, 135.0, 115.0, 50.0, 43.0, 18.0, 14.0, 12.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3709821701049805, -5.174742221832275, -4.97850227355957, -4.782262802124023, -4.586022853851318, -4.389782905578613, -4.193542957305908, -3.997303009033203, -3.801063060760498, -3.604823112487793, -3.408583402633667, -3.212343454360962, -3.016103506088257, -2.819863796234131, -2.623623847961426, -2.4273838996887207, -2.2311441898345947, -2.0349042415618896, -1.8386644124984741, -1.6424245834350586, -1.4461846351623535, -1.249944806098938, -1.0537049770355225, -0.8574650287628174, -0.6612251996994019, -0.46498531103134155, -0.26874545216560364, -0.07250559329986572, 0.12373429536819458, 0.3199741840362549, 0.5162140130996704, 0.7124539613723755, 0.908693790435791, 1.1049336194992065, 1.3011735677719116, 1.4974133968353271, 1.6936533451080322, 1.8898931741714478, 2.0861330032348633, 2.2823729515075684, 2.4786128997802734, 2.6748528480529785, 2.8710925579071045, 3.0673325061798096, 3.2635724544525146, 3.4598121643066406, 3.6560521125793457, 3.852292060852051, 4.048531532287598, 4.244771480560303, 4.441011428833008, 4.637250900268555, 4.83349084854126, 5.029730796813965, 5.22597074508667, 5.422210693359375, 5.61845064163208, 5.814690589904785, 6.01093053817749, 6.207170486450195, 6.403409957885742, 6.599649906158447, 6.795889854431152, 6.992129802703857, 7.1883697509765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 7.0, 10.0, 10.0, 9.0, 12.0, 15.0, 21.0, 22.0, 34.0, 28.0, 42.0, 34.0, 27.0, 46.0, 39.0, 57.0, 44.0, 48.0, 41.0, 62.0, 50.0, 37.0, 34.0, 43.0, 38.0, 22.0, 24.0, 26.0, 14.0, 17.0, 12.0, 12.0, 12.0, 9.0, 6.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.063088893890381, -1.9899500608444214, -1.916811227798462, -1.8436723947525024, -1.770533561706543, -1.697394609451294, -1.6242557764053345, -1.551116943359375, -1.4779781103134155, -1.404839277267456, -1.3317004442214966, -1.258561611175537, -1.185422658920288, -1.1122839450836182, -1.0391449928283691, -0.9660061597824097, -0.8928673267364502, -0.8197284936904907, -0.7465896606445312, -0.673450767993927, -0.6003119349479675, -0.5271731019020081, -0.4540342390537262, -0.38089537620544434, -0.30775654315948486, -0.2346176952123642, -0.16147884726524353, -0.08833999931812286, -0.015201151371002197, 0.057937681674957275, 0.13107654452323914, 0.204215407371521, 0.27735424041748047, 0.35049307346343994, 0.4236319363117218, 0.49677079916000366, 0.5699096322059631, 0.6430484652519226, 0.7161873579025269, 0.7893261909484863, 0.8624650239944458, 0.9356038570404053, 1.0087426900863647, 1.0818815231323242, 1.1550204753875732, 1.2281591892242432, 1.3012981414794922, 1.3744369745254517, 1.4475758075714111, 1.5207146406173706, 1.59385347366333, 1.6669923067092896, 1.740131139755249, 1.813270092010498, 1.8864089250564575, 1.959547758102417, 2.032686710357666, 2.105825662612915, 2.178964376449585, 2.252103328704834, 2.325242042541504, 2.398380994796753, 2.471519708633423, 2.544658660888672, 2.617797374725342]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 6.0, 8.0, 16.0, 19.0, 25.0, 29.0, 66.0, 107.0, 162.0, 249.0, 451.0, 741.0, 1430.0, 3065.0, 6910.0, 16624.0, 43500.0, 125590.0, 310545.0, 324384.0, 135526.0, 47493.0, 17652.0, 7229.0, 3170.0, 1560.0, 793.0, 456.0, 246.0, 156.0, 84.0, 79.0, 53.0, 36.0, 20.0, 11.0, 15.0, 9.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.424072265625, -0.4099540710449219, -0.39583587646484375, -0.3817176818847656, -0.3675994873046875, -0.3534812927246094, -0.33936309814453125, -0.3252449035644531, -0.311126708984375, -0.2970085144042969, -0.28289031982421875, -0.2687721252441406, -0.2546539306640625, -0.24053573608398438, -0.22641754150390625, -0.21229934692382812, -0.19818115234375, -0.18406295776367188, -0.16994476318359375, -0.15582656860351562, -0.1417083740234375, -0.12759017944335938, -0.11347198486328125, -0.09935379028320312, -0.085235595703125, -0.07111740112304688, -0.05699920654296875, -0.042881011962890625, -0.0287628173828125, -0.014644622802734375, -0.00052642822265625, 0.013591766357421875, 0.0277099609375, 0.041828155517578125, 0.05594635009765625, 0.07006454467773438, 0.0841827392578125, 0.09830093383789062, 0.11241912841796875, 0.12653732299804688, 0.140655517578125, 0.15477371215820312, 0.16889190673828125, 0.18301010131835938, 0.1971282958984375, 0.21124649047851562, 0.22536468505859375, 0.23948287963867188, 0.25360107421875, 0.2677192687988281, 0.28183746337890625, 0.2959556579589844, 0.3100738525390625, 0.3241920471191406, 0.33831024169921875, 0.3524284362792969, 0.366546630859375, 0.3806648254394531, 0.39478302001953125, 0.4089012145996094, 0.4230194091796875, 0.4371376037597656, 0.45125579833984375, 0.4653739929199219, 0.4794921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 7.0, 10.0, 7.0, 15.0, 9.0, 26.0, 23.0, 22.0, 18.0, 33.0, 36.0, 43.0, 37.0, 49.0, 48.0, 51.0, 49.0, 59.0, 52.0, 36.0, 46.0, 47.0, 50.0, 31.0, 29.0, 26.0, 22.0, 15.0, 15.0, 18.0, 13.0, 8.0, 5.0, 12.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5244140625, -1.4734344482421875, -1.422454833984375, -1.3714752197265625, -1.32049560546875, -1.2695159912109375, -1.218536376953125, -1.1675567626953125, -1.1165771484375, -1.0655975341796875, -1.014617919921875, -0.9636383056640625, -0.91265869140625, -0.8616790771484375, -0.810699462890625, -0.7597198486328125, -0.708740234375, -0.6577606201171875, -0.606781005859375, -0.5558013916015625, -0.50482177734375, -0.4538421630859375, -0.402862548828125, -0.3518829345703125, -0.3009033203125, -0.2499237060546875, -0.198944091796875, -0.1479644775390625, -0.09698486328125, -0.0460052490234375, 0.004974365234375, 0.0559539794921875, 0.10693359375, 0.1579132080078125, 0.208892822265625, 0.2598724365234375, 0.31085205078125, 0.3618316650390625, 0.412811279296875, 0.4637908935546875, 0.5147705078125, 0.5657501220703125, 0.616729736328125, 0.6677093505859375, 0.71868896484375, 0.7696685791015625, 0.820648193359375, 0.8716278076171875, 0.922607421875, 0.9735870361328125, 1.024566650390625, 1.0755462646484375, 1.12652587890625, 1.1775054931640625, 1.228485107421875, 1.2794647216796875, 1.3304443359375, 1.3814239501953125, 1.432403564453125, 1.4833831787109375, 1.53436279296875, 1.5853424072265625, 1.636322021484375, 1.6873016357421875, 1.73828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 10.0, 8.0, 17.0, 22.0, 33.0, 38.0, 58.0, 82.0, 128.0, 207.0, 321.0, 514.0, 850.0, 1251.0, 2073.0, 3647.0, 5992.0, 9830.0, 16471.0, 27862.0, 46777.0, 76564.0, 120267.0, 164654.0, 178530.0, 145444.0, 97520.0, 59992.0, 35978.0, 21432.0, 12702.0, 7763.0, 4612.0, 2736.0, 1598.0, 1021.0, 561.0, 334.0, 238.0, 145.0, 100.0, 58.0, 51.0, 31.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1871337890625, -0.18150711059570312, -0.17588043212890625, -0.17025375366210938, -0.1646270751953125, -0.15900039672851562, -0.15337371826171875, -0.14774703979492188, -0.142120361328125, -0.13649368286132812, -0.13086700439453125, -0.12524032592773438, -0.1196136474609375, -0.11398696899414062, -0.10836029052734375, -0.10273361206054688, -0.09710693359375, -0.09148025512695312, -0.08585357666015625, -0.08022689819335938, -0.0746002197265625, -0.06897354125976562, -0.06334686279296875, -0.057720184326171875, -0.052093505859375, -0.046466827392578125, -0.04084014892578125, -0.035213470458984375, -0.0295867919921875, -0.023960113525390625, -0.01833343505859375, -0.012706756591796875, -0.007080078125, -0.001453399658203125, 0.00417327880859375, 0.009799957275390625, 0.0154266357421875, 0.021053314208984375, 0.02667999267578125, 0.032306671142578125, 0.037933349609375, 0.043560028076171875, 0.04918670654296875, 0.054813385009765625, 0.0604400634765625, 0.06606674194335938, 0.07169342041015625, 0.07732009887695312, 0.08294677734375, 0.08857345581054688, 0.09420013427734375, 0.09982681274414062, 0.1054534912109375, 0.11108016967773438, 0.11670684814453125, 0.12233352661132812, 0.127960205078125, 0.13358688354492188, 0.13921356201171875, 0.14484024047851562, 0.1504669189453125, 0.15609359741210938, 0.16172027587890625, 0.16734695434570312, 0.1729736328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 10.0, 9.0, 12.0, 15.0, 19.0, 19.0, 22.0, 24.0, 28.0, 41.0, 31.0, 41.0, 41.0, 56.0, 51.0, 53.0, 53.0, 49.0, 47.0, 48.0, 41.0, 38.0, 36.0, 44.0, 30.0, 24.0, 23.0, 21.0, 12.0, 11.0, 8.0, 12.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.69366455078125, -3.5924072265625, -3.49114990234375, -3.389892578125, -3.28863525390625, -3.1873779296875, -3.08612060546875, -2.98486328125, -2.88360595703125, -2.7823486328125, -2.68109130859375, -2.579833984375, -2.47857666015625, -2.3773193359375, -2.27606201171875, -2.1748046875, -2.07354736328125, -1.9722900390625, -1.87103271484375, -1.769775390625, -1.66851806640625, -1.5672607421875, -1.46600341796875, -1.36474609375, -1.26348876953125, -1.1622314453125, -1.06097412109375, -0.959716796875, -0.85845947265625, -0.7572021484375, -0.65594482421875, -0.5546875, -0.45343017578125, -0.3521728515625, -0.25091552734375, -0.149658203125, -0.04840087890625, 0.0528564453125, 0.15411376953125, 0.25537109375, 0.35662841796875, 0.4578857421875, 0.55914306640625, 0.660400390625, 0.76165771484375, 0.8629150390625, 0.96417236328125, 1.0654296875, 1.16668701171875, 1.2679443359375, 1.36920166015625, 1.470458984375, 1.57171630859375, 1.6729736328125, 1.77423095703125, 1.87548828125, 1.97674560546875, 2.0780029296875, 2.17926025390625, 2.280517578125, 2.38177490234375, 2.4830322265625, 2.58428955078125, 2.685546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 11.0, 13.0, 35.0, 37.0, 72.0, 124.0, 218.0, 368.0, 790.0, 1735.0, 5217.0, 20397.0, 113813.0, 479533.0, 342577.0, 64532.0, 12596.0, 3742.0, 1310.0, 635.0, 338.0, 196.0, 108.0, 63.0, 31.0, 20.0, 15.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07769775390625, -0.07569742202758789, -0.07369709014892578, -0.07169675827026367, -0.06969642639160156, -0.06769609451293945, -0.06569576263427734, -0.06369543075561523, -0.061695098876953125, -0.059694766998291016, -0.057694435119628906, -0.0556941032409668, -0.05369377136230469, -0.05169343948364258, -0.04969310760498047, -0.04769277572631836, -0.04569244384765625, -0.04369211196899414, -0.04169178009033203, -0.03969144821166992, -0.03769111633300781, -0.0356907844543457, -0.033690452575683594, -0.031690120697021484, -0.029689788818359375, -0.027689456939697266, -0.025689125061035156, -0.023688793182373047, -0.021688461303710938, -0.019688129425048828, -0.01768779754638672, -0.01568746566772461, -0.0136871337890625, -0.01168680191040039, -0.009686470031738281, -0.007686138153076172, -0.0056858062744140625, -0.003685474395751953, -0.0016851425170898438, 0.0003151893615722656, 0.002315521240234375, 0.004315853118896484, 0.006316184997558594, 0.008316516876220703, 0.010316848754882812, 0.012317180633544922, 0.014317512512207031, 0.01631784439086914, 0.01831817626953125, 0.02031850814819336, 0.02231884002685547, 0.024319171905517578, 0.026319503784179688, 0.028319835662841797, 0.030320167541503906, 0.032320499420166016, 0.034320831298828125, 0.036321163177490234, 0.038321495056152344, 0.04032182693481445, 0.04232215881347656, 0.04432249069213867, 0.04632282257080078, 0.04832315444946289, 0.050323486328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 4.0, 6.0, 11.0, 16.0, 19.0, 37.0, 37.0, 65.0, 62.0, 83.0, 118.0, 110.0, 86.0, 79.0, 59.0, 49.0, 46.0, 26.0, 22.0, 13.0, 9.0, 13.0, 12.0, 2.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.553794860839844e-05, -4.435330629348755e-05, -4.316866397857666e-05, -4.198402166366577e-05, -4.079937934875488e-05, -3.9614737033843994e-05, -3.8430094718933105e-05, -3.724545240402222e-05, -3.606081008911133e-05, -3.487616777420044e-05, -3.369152545928955e-05, -3.250688314437866e-05, -3.1322240829467773e-05, -3.0137598514556885e-05, -2.8952956199645996e-05, -2.7768313884735107e-05, -2.658367156982422e-05, -2.539902925491333e-05, -2.421438694000244e-05, -2.3029744625091553e-05, -2.1845102310180664e-05, -2.0660459995269775e-05, -1.9475817680358887e-05, -1.8291175365447998e-05, -1.710653305053711e-05, -1.592189073562622e-05, -1.4737248420715332e-05, -1.3552606105804443e-05, -1.2367963790893555e-05, -1.1183321475982666e-05, -9.998679161071777e-06, -8.814036846160889e-06, -7.62939453125e-06, -6.444752216339111e-06, -5.260109901428223e-06, -4.075467586517334e-06, -2.8908252716064453e-06, -1.7061829566955566e-06, -5.21540641784668e-07, 6.631016731262207e-07, 1.8477439880371094e-06, 3.032386302947998e-06, 4.217028617858887e-06, 5.401670932769775e-06, 6.586313247680664e-06, 7.770955562591553e-06, 8.955597877502441e-06, 1.014024019241333e-05, 1.1324882507324219e-05, 1.2509524822235107e-05, 1.3694167137145996e-05, 1.4878809452056885e-05, 1.6063451766967773e-05, 1.7248094081878662e-05, 1.843273639678955e-05, 1.961737871170044e-05, 2.0802021026611328e-05, 2.1986663341522217e-05, 2.3171305656433105e-05, 2.4355947971343994e-05, 2.5540590286254883e-05, 2.672523260116577e-05, 2.790987491607666e-05, 2.909451723098755e-05, 3.0279159545898438e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 13.0, 25.0, 34.0, 42.0, 81.0, 88.0, 149.0, 282.0, 426.0, 941.0, 1921.0, 4753.0, 13187.0, 43405.0, 157966.0, 396853.0, 297443.0, 90721.0, 25866.0, 8244.0, 3096.0, 1378.0, 664.0, 349.0, 195.0, 150.0, 76.0, 61.0, 36.0, 24.0, 17.0, 11.0, 8.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04205322265625, -0.04064130783081055, -0.039229393005371094, -0.03781747817993164, -0.03640556335449219, -0.034993648529052734, -0.03358173370361328, -0.03216981887817383, -0.030757904052734375, -0.029345989227294922, -0.02793407440185547, -0.026522159576416016, -0.025110244750976562, -0.02369832992553711, -0.022286415100097656, -0.020874500274658203, -0.01946258544921875, -0.018050670623779297, -0.016638755798339844, -0.01522684097290039, -0.013814926147460938, -0.012403011322021484, -0.010991096496582031, -0.009579181671142578, -0.008167266845703125, -0.006755352020263672, -0.005343437194824219, -0.003931522369384766, -0.0025196075439453125, -0.0011076927185058594, 0.00030422210693359375, 0.0017161369323730469, 0.0031280517578125, 0.004539966583251953, 0.005951881408691406, 0.007363796234130859, 0.008775711059570312, 0.010187625885009766, 0.011599540710449219, 0.013011455535888672, 0.014423370361328125, 0.015835285186767578, 0.01724720001220703, 0.018659114837646484, 0.020071029663085938, 0.02148294448852539, 0.022894859313964844, 0.024306774139404297, 0.02571868896484375, 0.027130603790283203, 0.028542518615722656, 0.02995443344116211, 0.03136634826660156, 0.032778263092041016, 0.03419017791748047, 0.03560209274291992, 0.037014007568359375, 0.03842592239379883, 0.03983783721923828, 0.041249752044677734, 0.04266166687011719, 0.04407358169555664, 0.045485496520996094, 0.04689741134643555, 0.048309326171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 3.0, 9.0, 12.0, 16.0, 23.0, 19.0, 16.0, 35.0, 40.0, 56.0, 58.0, 83.0, 66.0, 86.0, 69.0, 65.0, 60.0, 61.0, 53.0, 41.0, 28.0, 22.0, 17.0, 11.0, 8.0, 5.0, 7.0, 8.0, 0.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.014617919921875, -0.01419830322265625, -0.0137786865234375, -0.01335906982421875, -0.012939453125, -0.01251983642578125, -0.0121002197265625, -0.01168060302734375, -0.011260986328125, -0.01084136962890625, -0.0104217529296875, -0.01000213623046875, -0.00958251953125, -0.00916290283203125, -0.0087432861328125, -0.00832366943359375, -0.007904052734375, -0.00748443603515625, -0.0070648193359375, -0.00664520263671875, -0.0062255859375, -0.00580596923828125, -0.0053863525390625, -0.00496673583984375, -0.004547119140625, -0.00412750244140625, -0.0037078857421875, -0.00328826904296875, -0.00286865234375, -0.00244903564453125, -0.0020294189453125, -0.00160980224609375, -0.001190185546875, -0.00077056884765625, -0.0003509521484375, 6.866455078125e-05, 0.00048828125, 0.00090789794921875, 0.0013275146484375, 0.00174713134765625, 0.002166748046875, 0.00258636474609375, 0.0030059814453125, 0.00342559814453125, 0.00384521484375, 0.00426483154296875, 0.0046844482421875, 0.00510406494140625, 0.005523681640625, 0.00594329833984375, 0.0063629150390625, 0.00678253173828125, 0.0072021484375, 0.00762176513671875, 0.0080413818359375, 0.00846099853515625, 0.008880615234375, 0.00930023193359375, 0.0097198486328125, 0.01013946533203125, 0.01055908203125, 0.01097869873046875, 0.0113983154296875, 0.01181793212890625, 0.012237548828125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 15.0, 38.0, 84.0, 152.0, 198.0, 176.0, 159.0, 104.0, 28.0, 26.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.076685905456543, -4.9233880043029785, -4.770089626312256, -4.616791725158691, -4.463493347167969, -4.310195446014404, -4.15689754486084, -4.003599166870117, -3.8503012657165527, -3.697003126144409, -3.5437049865722656, -3.390407085418701, -3.2371089458465576, -3.083810806274414, -2.9305129051208496, -2.777214765548706, -2.6239166259765625, -2.470618486404419, -2.3173203468322754, -2.164022445678711, -2.0107243061065674, -1.8574261665344238, -1.7041281461715698, -1.5508301258087158, -1.3975319862365723, -1.2442338466644287, -1.0909358263015747, -0.9376377463340759, -0.7843396663665771, -0.6310415863990784, -0.4777435064315796, -0.3244454860687256, -0.17114734649658203, -0.017849266529083252, 0.13544881343841553, 0.2887468934059143, 0.4420449733734131, 0.5953430533409119, 0.7486411333084106, 0.9019391536712646, 1.0552372932434082, 1.2085354328155518, 1.3618334531784058, 1.5151314735412598, 1.6684296131134033, 1.8217277526855469, 1.9750257730484009, 2.128323793411255, 2.2816219329833984, 2.434920072555542, 2.5882182121276855, 2.74151611328125, 2.8948142528533936, 3.048112392425537, 3.2014102935791016, 3.354708433151245, 3.5080065727233887, 3.6613047122955322, 3.814602851867676, 3.9679007530212402, 4.121198654174805, 4.274497032165527, 4.427794933319092, 4.581092834472656, 4.734391212463379]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 15.0, 10.0, 17.0, 14.0, 24.0, 31.0, 36.0, 39.0, 41.0, 46.0, 44.0, 56.0, 58.0, 60.0, 47.0, 73.0, 59.0, 35.0, 48.0, 36.0, 31.0, 29.0, 26.0, 24.0, 16.0, 12.0, 8.0, 8.0, 9.0, 5.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5080432891845703, -1.4532721042633057, -1.398500919342041, -1.3437297344207764, -1.2889585494995117, -1.234187364578247, -1.1794160604476929, -1.1246448755264282, -1.0698736906051636, -1.015102505683899, -0.9603313207626343, -0.9055600762367249, -0.8507888913154602, -0.7960177063941956, -0.7412464618682861, -0.6864752769470215, -0.6317040920257568, -0.5769329071044922, -0.5221617221832275, -0.4673904776573181, -0.41261929273605347, -0.3578481078147888, -0.3030768930912018, -0.24830567836761475, -0.1935344934463501, -0.13876329362392426, -0.08399209380149841, -0.02922089397907257, 0.02555030584335327, 0.08032149076461792, 0.13509270548820496, 0.189863920211792, 0.24463510513305664, 0.2994062900543213, 0.3541775047779083, 0.40894871950149536, 0.46371990442276, 0.5184910893440247, 0.5732623338699341, 0.6280335187911987, 0.6828047037124634, 0.737575888633728, 0.7923470735549927, 0.8471183180809021, 0.9018895030021667, 0.9566606879234314, 1.0114319324493408, 1.0662031173706055, 1.1209743022918701, 1.1757454872131348, 1.2305166721343994, 1.285287857055664, 1.3400590419769287, 1.3948302268981934, 1.4496015310287476, 1.5043727159500122, 1.5591439008712769, 1.6139150857925415, 1.6686862707138062, 1.7234574556350708, 1.778228759765625, 1.8329999446868896, 1.8877711296081543, 1.942542314529419, 1.9973134994506836]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 12.0, 18.0, 25.0, 34.0, 60.0, 85.0, 182.0, 364.0, 799.0, 2041.0, 6928.0, 27566.0, 143249.0, 701292.0, 130325.0, 25625.0, 6441.0, 1952.0, 726.0, 325.0, 189.0, 108.0, 61.0, 30.0, 27.0, 17.0, 12.0, 8.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.7901611328125, -2.709228515625, -2.6282958984375, -2.54736328125, -2.4664306640625, -2.385498046875, -2.3045654296875, -2.2236328125, -2.1427001953125, -2.061767578125, -1.9808349609375, -1.89990234375, -1.8189697265625, -1.738037109375, -1.6571044921875, -1.576171875, -1.4952392578125, -1.414306640625, -1.3333740234375, -1.25244140625, -1.1715087890625, -1.090576171875, -1.0096435546875, -0.9287109375, -0.8477783203125, -0.766845703125, -0.6859130859375, -0.60498046875, -0.5240478515625, -0.443115234375, -0.3621826171875, -0.28125, -0.2003173828125, -0.119384765625, -0.0384521484375, 0.04248046875, 0.1234130859375, 0.204345703125, 0.2852783203125, 0.3662109375, 0.4471435546875, 0.528076171875, 0.6090087890625, 0.68994140625, 0.7708740234375, 0.851806640625, 0.9327392578125, 1.013671875, 1.0946044921875, 1.175537109375, 1.2564697265625, 1.33740234375, 1.4183349609375, 1.499267578125, 1.5802001953125, 1.6611328125, 1.7420654296875, 1.822998046875, 1.9039306640625, 1.98486328125, 2.0657958984375, 2.146728515625, 2.2276611328125, 2.30859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 8.0, 8.0, 7.0, 19.0, 14.0, 10.0, 28.0, 24.0, 29.0, 33.0, 47.0, 37.0, 44.0, 48.0, 54.0, 67.0, 49.0, 55.0, 49.0, 49.0, 46.0, 37.0, 44.0, 27.0, 27.0, 30.0, 10.0, 23.0, 17.0, 13.0, 7.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.803558349609375, -2.69696044921875, -2.590362548828125, -2.4837646484375, -2.377166748046875, -2.27056884765625, -2.163970947265625, -2.057373046875, -1.950775146484375, -1.84417724609375, -1.737579345703125, -1.6309814453125, -1.524383544921875, -1.41778564453125, -1.311187744140625, -1.20458984375, -1.097991943359375, -0.99139404296875, -0.884796142578125, -0.7781982421875, -0.671600341796875, -0.56500244140625, -0.458404541015625, -0.351806640625, -0.245208740234375, -0.13861083984375, -0.032012939453125, 0.0745849609375, 0.181182861328125, 0.28778076171875, 0.394378662109375, 0.5009765625, 0.607574462890625, 0.71417236328125, 0.820770263671875, 0.9273681640625, 1.033966064453125, 1.14056396484375, 1.247161865234375, 1.353759765625, 1.460357666015625, 1.56695556640625, 1.673553466796875, 1.7801513671875, 1.886749267578125, 1.99334716796875, 2.099945068359375, 2.20654296875, 2.313140869140625, 2.41973876953125, 2.526336669921875, 2.6329345703125, 2.739532470703125, 2.84613037109375, 2.952728271484375, 3.059326171875, 3.165924072265625, 3.27252197265625, 3.379119873046875, 3.4857177734375, 3.592315673828125, 3.69891357421875, 3.805511474609375, 3.912109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 5.0, 9.0, 12.0, 7.0, 23.0, 26.0, 26.0, 35.0, 50.0, 84.0, 85.0, 148.0, 201.0, 297.0, 526.0, 1388.0, 11388.0, 460406.0, 558440.0, 12294.0, 1496.0, 538.0, 291.0, 206.0, 159.0, 98.0, 78.0, 45.0, 42.0, 41.0, 22.0, 21.0, 16.0, 14.0, 5.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625, -5.46435546875, -5.3037109375, -5.14306640625, -4.982421875, -4.82177734375, -4.6611328125, -4.50048828125, -4.33984375, -4.17919921875, -4.0185546875, -3.85791015625, -3.697265625, -3.53662109375, -3.3759765625, -3.21533203125, -3.0546875, -2.89404296875, -2.7333984375, -2.57275390625, -2.412109375, -2.25146484375, -2.0908203125, -1.93017578125, -1.76953125, -1.60888671875, -1.4482421875, -1.28759765625, -1.126953125, -0.96630859375, -0.8056640625, -0.64501953125, -0.484375, -0.32373046875, -0.1630859375, -0.00244140625, 0.158203125, 0.31884765625, 0.4794921875, 0.64013671875, 0.80078125, 0.96142578125, 1.1220703125, 1.28271484375, 1.443359375, 1.60400390625, 1.7646484375, 1.92529296875, 2.0859375, 2.24658203125, 2.4072265625, 2.56787109375, 2.728515625, 2.88916015625, 3.0498046875, 3.21044921875, 3.37109375, 3.53173828125, 3.6923828125, 3.85302734375, 4.013671875, 4.17431640625, 4.3349609375, 4.49560546875, 4.65625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 5.0, 6.0, 4.0, 3.0, 9.0, 11.0, 10.0, 17.0, 17.0, 10.0, 18.0, 18.0, 38.0, 27.0, 39.0, 41.0, 39.0, 47.0, 61.0, 57.0, 60.0, 49.0, 54.0, 44.0, 33.0, 37.0, 34.0, 24.0, 28.0, 26.0, 19.0, 19.0, 18.0, 12.0, 10.0, 11.0, 13.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.784698486328125, -3.66705322265625, -3.549407958984375, -3.4317626953125, -3.314117431640625, -3.19647216796875, -3.078826904296875, -2.961181640625, -2.843536376953125, -2.72589111328125, -2.608245849609375, -2.4906005859375, -2.372955322265625, -2.25531005859375, -2.137664794921875, -2.02001953125, -1.902374267578125, -1.78472900390625, -1.667083740234375, -1.5494384765625, -1.431793212890625, -1.31414794921875, -1.196502685546875, -1.078857421875, -0.961212158203125, -0.84356689453125, -0.725921630859375, -0.6082763671875, -0.490631103515625, -0.37298583984375, -0.255340576171875, -0.1376953125, -0.020050048828125, 0.09759521484375, 0.215240478515625, 0.3328857421875, 0.450531005859375, 0.56817626953125, 0.685821533203125, 0.803466796875, 0.921112060546875, 1.03875732421875, 1.156402587890625, 1.2740478515625, 1.391693115234375, 1.50933837890625, 1.626983642578125, 1.74462890625, 1.862274169921875, 1.97991943359375, 2.097564697265625, 2.2152099609375, 2.332855224609375, 2.45050048828125, 2.568145751953125, 2.685791015625, 2.803436279296875, 2.92108154296875, 3.038726806640625, 3.1563720703125, 3.274017333984375, 3.39166259765625, 3.509307861328125, 3.626953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 19.0, 25.0, 76.0, 152.0, 382.0, 968.0, 7065.0, 1010370.0, 27230.0, 1484.0, 458.0, 167.0, 78.0, 26.0, 12.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.169921875, -3.050933837890625, -2.93194580078125, -2.812957763671875, -2.6939697265625, -2.574981689453125, -2.45599365234375, -2.337005615234375, -2.218017578125, -2.099029541015625, -1.98004150390625, -1.861053466796875, -1.7420654296875, -1.623077392578125, -1.50408935546875, -1.385101318359375, -1.26611328125, -1.147125244140625, -1.02813720703125, -0.909149169921875, -0.7901611328125, -0.671173095703125, -0.55218505859375, -0.433197021484375, -0.314208984375, -0.195220947265625, -0.07623291015625, 0.042755126953125, 0.1617431640625, 0.280731201171875, 0.39971923828125, 0.518707275390625, 0.6376953125, 0.756683349609375, 0.87567138671875, 0.994659423828125, 1.1136474609375, 1.232635498046875, 1.35162353515625, 1.470611572265625, 1.589599609375, 1.708587646484375, 1.82757568359375, 1.946563720703125, 2.0655517578125, 2.184539794921875, 2.30352783203125, 2.422515869140625, 2.54150390625, 2.660491943359375, 2.77947998046875, 2.898468017578125, 3.0174560546875, 3.136444091796875, 3.25543212890625, 3.374420166015625, 3.493408203125, 3.612396240234375, 3.73138427734375, 3.850372314453125, 3.9693603515625, 4.088348388671875, 4.20733642578125, 4.326324462890625, 4.4453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 11.0, 8.0, 19.0, 21.0, 32.0, 46.0, 83.0, 174.0, 302.0, 100.0, 61.0, 43.0, 26.0, 28.0, 10.0, 15.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002713203430175781, -0.00026402994990348816, -0.0002567395567893982, -0.00024944916367530823, -0.00024215877056121826, -0.0002348683774471283, -0.00022757798433303833, -0.00022028759121894836, -0.0002129971981048584, -0.00020570680499076843, -0.00019841641187667847, -0.0001911260187625885, -0.00018383562564849854, -0.00017654523253440857, -0.0001692548394203186, -0.00016196444630622864, -0.00015467405319213867, -0.0001473836600780487, -0.00014009326696395874, -0.00013280287384986877, -0.0001255124807357788, -0.00011822208762168884, -0.00011093169450759888, -0.00010364130139350891, -9.635090827941895e-05, -8.906051516532898e-05, -8.177012205123901e-05, -7.447972893714905e-05, -6.718933582305908e-05, -5.9898942708969116e-05, -5.260854959487915e-05, -4.5318156480789185e-05, -3.802776336669922e-05, -3.073737025260925e-05, -2.3446977138519287e-05, -1.615658402442932e-05, -8.866190910339355e-06, -1.5757977962493896e-06, 5.714595317840576e-06, 1.3004988431930542e-05, 2.0295381546020508e-05, 2.7585774660110474e-05, 3.487616777420044e-05, 4.2166560888290405e-05, 4.945695400238037e-05, 5.674734711647034e-05, 6.40377402305603e-05, 7.132813334465027e-05, 7.861852645874023e-05, 8.59089195728302e-05, 9.319931268692017e-05, 0.00010048970580101013, 0.0001077800989151001, 0.00011507049202919006, 0.00012236088514328003, 0.00012965127825737, 0.00013694167137145996, 0.00014423206448554993, 0.0001515224575996399, 0.00015881285071372986, 0.00016610324382781982, 0.0001733936369419098, 0.00018068403005599976, 0.00018797442317008972, 0.0001952648162841797]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 17.0, 12.0, 30.0, 55.0, 103.0, 229.0, 482.0, 1334.0, 18131.0, 1011387.0, 14615.0, 1215.0, 495.0, 198.0, 101.0, 63.0, 32.0, 18.0, 12.0, 9.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.062255859375, -3.94091796875, -3.819580078125, -3.6982421875, -3.576904296875, -3.45556640625, -3.334228515625, -3.212890625, -3.091552734375, -2.97021484375, -2.848876953125, -2.7275390625, -2.606201171875, -2.48486328125, -2.363525390625, -2.2421875, -2.120849609375, -1.99951171875, -1.878173828125, -1.7568359375, -1.635498046875, -1.51416015625, -1.392822265625, -1.271484375, -1.150146484375, -1.02880859375, -0.907470703125, -0.7861328125, -0.664794921875, -0.54345703125, -0.422119140625, -0.30078125, -0.179443359375, -0.05810546875, 0.063232421875, 0.1845703125, 0.305908203125, 0.42724609375, 0.548583984375, 0.669921875, 0.791259765625, 0.91259765625, 1.033935546875, 1.1552734375, 1.276611328125, 1.39794921875, 1.519287109375, 1.640625, 1.761962890625, 1.88330078125, 2.004638671875, 2.1259765625, 2.247314453125, 2.36865234375, 2.489990234375, 2.611328125, 2.732666015625, 2.85400390625, 2.975341796875, 3.0966796875, 3.218017578125, 3.33935546875, 3.460693359375, 3.58203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 10.0, 33.0, 51.0, 89.0, 383.0, 279.0, 89.0, 39.0, 16.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9375, -0.8998260498046875, -0.862152099609375, -0.8244781494140625, -0.78680419921875, -0.7491302490234375, -0.711456298828125, -0.6737823486328125, -0.6361083984375, -0.5984344482421875, -0.560760498046875, -0.5230865478515625, -0.48541259765625, -0.4477386474609375, -0.410064697265625, -0.3723907470703125, -0.334716796875, -0.2970428466796875, -0.259368896484375, -0.2216949462890625, -0.18402099609375, -0.1463470458984375, -0.108673095703125, -0.0709991455078125, -0.0333251953125, 0.0043487548828125, 0.042022705078125, 0.0796966552734375, 0.11737060546875, 0.1550445556640625, 0.192718505859375, 0.2303924560546875, 0.26806640625, 0.3057403564453125, 0.343414306640625, 0.3810882568359375, 0.41876220703125, 0.4564361572265625, 0.494110107421875, 0.5317840576171875, 0.5694580078125, 0.6071319580078125, 0.644805908203125, 0.6824798583984375, 0.72015380859375, 0.7578277587890625, 0.795501708984375, 0.8331756591796875, 0.870849609375, 0.9085235595703125, 0.946197509765625, 0.9838714599609375, 1.02154541015625, 1.0592193603515625, 1.096893310546875, 1.1345672607421875, 1.1722412109375, 1.2099151611328125, 1.247589111328125, 1.2852630615234375, 1.32293701171875, 1.3606109619140625, 1.398284912109375, 1.4359588623046875, 1.4736328125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 10.0, 23.0, 31.0, 55.0, 98.0, 110.0, 123.0, 140.0, 127.0, 100.0, 74.0, 34.0, 30.0, 13.0, 10.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.202199935913086, -7.987643718719482, -7.773087501525879, -7.558531284332275, -7.343975067138672, -7.129419326782227, -6.914863109588623, -6.7003068923950195, -6.485750675201416, -6.2711944580078125, -6.056638240814209, -5.8420820236206055, -5.62752628326416, -5.412969589233398, -5.198413848876953, -4.98385763168335, -4.769301414489746, -4.554745197296143, -4.340188980102539, -4.1256327629089355, -3.911076784133911, -3.6965205669403076, -3.481964588165283, -3.2674083709716797, -3.052852153778076, -2.8382959365844727, -2.623739719390869, -2.4091837406158447, -2.194627523422241, -1.9800713062286377, -1.7655152082443237, -1.5509591102600098, -1.336402416229248, -1.1218461990356445, -0.9072901010513306, -0.6927339434623718, -0.4781777858734131, -0.26362156867980957, -0.049065470695495605, 0.16549062728881836, 0.3800468444824219, 0.5946030020713806, 0.8091591596603394, 1.0237152576446533, 1.2382714748382568, 1.4528276920318604, 1.6673837900161743, 1.8819398880004883, 2.096496105194092, 2.3110523223876953, 2.525608539581299, 2.7401645183563232, 2.9547207355499268, 3.1692769527435303, 3.3838329315185547, 3.598389148712158, 3.8129453659057617, 4.027501583099365, 4.242057800292969, 4.456614017486572, 4.671170234680176, 4.885725975036621, 5.100282192230225, 5.314838409423828, 5.529394626617432]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 4.0, 6.0, 13.0, 7.0, 10.0, 7.0, 7.0, 18.0, 12.0, 27.0, 21.0, 29.0, 29.0, 45.0, 32.0, 37.0, 36.0, 40.0, 43.0, 40.0, 43.0, 51.0, 42.0, 39.0, 31.0, 37.0, 37.0, 34.0, 33.0, 24.0, 29.0, 27.0, 24.0, 11.0, 20.0, 11.0, 6.0, 7.0, 7.0, 5.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.1834845542907715, -5.010655403137207, -4.837826251983643, -4.664997100830078, -4.4921674728393555, -4.319338321685791, -4.146509170532227, -3.973680019378662, -3.8008508682250977, -3.628021717071533, -3.4551925659179688, -3.282363176345825, -3.1095340251922607, -2.9367048740386963, -2.7638754844665527, -2.5910463333129883, -2.418217182159424, -2.2453880310058594, -2.072558879852295, -1.8997294902801514, -1.726900339126587, -1.5540711879730225, -1.3812419176101685, -1.2084126472473145, -1.03558349609375, -0.8627542853355408, -0.6899250745773315, -0.5170958638191223, -0.3442666530609131, -0.17143744230270386, 0.001391768455505371, 0.17422103881835938, 0.34705066680908203, 0.5198798775672913, 0.6927090883255005, 0.8655382990837097, 1.038367509841919, 1.2111966609954834, 1.3840259313583374, 1.5568552017211914, 1.7296843528747559, 1.9025135040283203, 2.0753426551818848, 2.2481720447540283, 2.4210011959075928, 2.5938303470611572, 2.766659736633301, 2.9394888877868652, 3.1123180389404297, 3.285147190093994, 3.4579763412475586, 3.630805730819702, 3.8036348819732666, 3.976464033126831, 4.149293422698975, 4.322122573852539, 4.4949517250061035, 4.667780876159668, 4.840610027313232, 5.013439178466797, 5.1862688064575195, 5.359097957611084, 5.531927108764648, 5.704756259918213, 5.877585411071777]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 9.0, 13.0, 5.0, 18.0, 27.0, 20.0, 23.0, 27.0, 48.0, 44.0, 79.0, 130.0, 299.0, 1302.0, 72392.0, 4094661.0, 23782.0, 776.0, 223.0, 94.0, 71.0, 43.0, 47.0, 37.0, 21.0, 20.0, 10.0, 14.0, 8.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.6796875, -14.26513671875, -13.8505859375, -13.43603515625, -13.021484375, -12.60693359375, -12.1923828125, -11.77783203125, -11.36328125, -10.94873046875, -10.5341796875, -10.11962890625, -9.705078125, -9.29052734375, -8.8759765625, -8.46142578125, -8.046875, -7.63232421875, -7.2177734375, -6.80322265625, -6.388671875, -5.97412109375, -5.5595703125, -5.14501953125, -4.73046875, -4.31591796875, -3.9013671875, -3.48681640625, -3.072265625, -2.65771484375, -2.2431640625, -1.82861328125, -1.4140625, -0.99951171875, -0.5849609375, -0.17041015625, 0.244140625, 0.65869140625, 1.0732421875, 1.48779296875, 1.90234375, 2.31689453125, 2.7314453125, 3.14599609375, 3.560546875, 3.97509765625, 4.3896484375, 4.80419921875, 5.21875, 5.63330078125, 6.0478515625, 6.46240234375, 6.876953125, 7.29150390625, 7.7060546875, 8.12060546875, 8.53515625, 8.94970703125, 9.3642578125, 9.77880859375, 10.193359375, 10.60791015625, 11.0224609375, 11.43701171875, 11.8515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 2.0, 16.0, 17.0, 15.0, 18.0, 21.0, 27.0, 33.0, 38.0, 51.0, 57.0, 54.0, 47.0, 59.0, 59.0, 49.0, 56.0, 60.0, 48.0, 38.0, 37.0, 39.0, 22.0, 14.0, 20.0, 14.0, 15.0, 9.0, 5.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.12109375, -2.057586669921875, -1.99407958984375, -1.930572509765625, -1.8670654296875, -1.803558349609375, -1.74005126953125, -1.676544189453125, -1.613037109375, -1.549530029296875, -1.48602294921875, -1.422515869140625, -1.3590087890625, -1.295501708984375, -1.23199462890625, -1.168487548828125, -1.10498046875, -1.041473388671875, -0.97796630859375, -0.914459228515625, -0.8509521484375, -0.787445068359375, -0.72393798828125, -0.660430908203125, -0.596923828125, -0.533416748046875, -0.46990966796875, -0.406402587890625, -0.3428955078125, -0.279388427734375, -0.21588134765625, -0.152374267578125, -0.0888671875, -0.025360107421875, 0.03814697265625, 0.101654052734375, 0.1651611328125, 0.228668212890625, 0.29217529296875, 0.355682373046875, 0.419189453125, 0.482696533203125, 0.54620361328125, 0.609710693359375, 0.6732177734375, 0.736724853515625, 0.80023193359375, 0.863739013671875, 0.92724609375, 0.990753173828125, 1.05426025390625, 1.117767333984375, 1.1812744140625, 1.244781494140625, 1.30828857421875, 1.371795654296875, 1.435302734375, 1.498809814453125, 1.56231689453125, 1.625823974609375, 1.6893310546875, 1.752838134765625, 1.81634521484375, 1.879852294921875, 1.943359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 20.0, 36.0, 65.0, 103.0, 203.0, 489.0, 1254.0, 4519.0, 39863.0, 2429501.0, 1681106.0, 31047.0, 4004.0, 1155.0, 413.0, 212.0, 101.0, 51.0, 44.0, 15.0, 11.0, 9.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.6419677734375, -5.459716796875, -5.2774658203125, -5.09521484375, -4.9129638671875, -4.730712890625, -4.5484619140625, -4.3662109375, -4.1839599609375, -4.001708984375, -3.8194580078125, -3.63720703125, -3.4549560546875, -3.272705078125, -3.0904541015625, -2.908203125, -2.7259521484375, -2.543701171875, -2.3614501953125, -2.17919921875, -1.9969482421875, -1.814697265625, -1.6324462890625, -1.4501953125, -1.2679443359375, -1.085693359375, -0.9034423828125, -0.72119140625, -0.5389404296875, -0.356689453125, -0.1744384765625, 0.0078125, 0.1900634765625, 0.372314453125, 0.5545654296875, 0.73681640625, 0.9190673828125, 1.101318359375, 1.2835693359375, 1.4658203125, 1.6480712890625, 1.830322265625, 2.0125732421875, 2.19482421875, 2.3770751953125, 2.559326171875, 2.7415771484375, 2.923828125, 3.1060791015625, 3.288330078125, 3.4705810546875, 3.65283203125, 3.8350830078125, 4.017333984375, 4.1995849609375, 4.3818359375, 4.5640869140625, 4.746337890625, 4.9285888671875, 5.11083984375, 5.2930908203125, 5.475341796875, 5.6575927734375, 5.83984375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 25.0, 30.0, 38.0, 66.0, 86.0, 152.0, 218.0, 331.0, 523.0, 651.0, 593.0, 442.0, 302.0, 197.0, 133.0, 88.0, 57.0, 38.0, 18.0, 17.0, 14.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1125030517578125, -1.077545166015625, -1.0425872802734375, -1.00762939453125, -0.9726715087890625, -0.937713623046875, -0.9027557373046875, -0.8677978515625, -0.8328399658203125, -0.797882080078125, -0.7629241943359375, -0.72796630859375, -0.6930084228515625, -0.658050537109375, -0.6230926513671875, -0.588134765625, -0.5531768798828125, -0.518218994140625, -0.4832611083984375, -0.44830322265625, -0.4133453369140625, -0.378387451171875, -0.3434295654296875, -0.3084716796875, -0.2735137939453125, -0.238555908203125, -0.2035980224609375, -0.16864013671875, -0.1336822509765625, -0.098724365234375, -0.0637664794921875, -0.02880859375, 0.0061492919921875, 0.041107177734375, 0.0760650634765625, 0.11102294921875, 0.1459808349609375, 0.180938720703125, 0.2158966064453125, 0.2508544921875, 0.2858123779296875, 0.320770263671875, 0.3557281494140625, 0.39068603515625, 0.4256439208984375, 0.460601806640625, 0.4955596923828125, 0.530517578125, 0.5654754638671875, 0.600433349609375, 0.6353912353515625, 0.67034912109375, 0.7053070068359375, 0.740264892578125, 0.7752227783203125, 0.8101806640625, 0.8451385498046875, 0.880096435546875, 0.9150543212890625, 0.95001220703125, 0.9849700927734375, 1.019927978515625, 1.0548858642578125, 1.08984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 28.0, 39.0, 65.0, 101.0, 137.0, 158.0, 145.0, 111.0, 101.0, 49.0, 34.0, 14.0, 10.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6952319145202637, -3.508453845977783, -3.3216757774353027, -3.134897470474243, -2.9481194019317627, -2.7613413333892822, -2.5745630264282227, -2.387784957885742, -2.2010068893432617, -2.0142288208007812, -1.8274506330490112, -1.6406724452972412, -1.4538943767547607, -1.2671163082122803, -1.0803381204605103, -0.8935599327087402, -0.7067818641662598, -0.5200037360191345, -0.3332256078720093, -0.14644747972488403, 0.04033064842224121, 0.22710877656936646, 0.4138869047164917, 0.6006650924682617, 0.7874431610107422, 0.9742212891578674, 1.1609994173049927, 1.3477776050567627, 1.5345556735992432, 1.7213337421417236, 1.9081119298934937, 2.0948901176452637, 2.281667709350586, 2.4684457778930664, 2.655223846435547, 2.8420021533966064, 3.028780221939087, 3.2155582904815674, 3.402336597442627, 3.5891146659851074, 3.775892734527588, 3.9626708030700684, 4.149448871612549, 4.336226940155029, 4.523005485534668, 4.709783554077148, 4.896561622619629, 5.083339691162109, 5.27011775970459, 5.45689582824707, 5.643673896789551, 5.830451965332031, 6.017230033874512, 6.20400857925415, 6.390786647796631, 6.577564716339111, 6.764342784881592, 6.951120853424072, 7.137898921966553, 7.324676990509033, 7.511455535888672, 7.698233604431152, 7.885011672973633, 8.071789741516113, 8.258567810058594]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 5.0, 8.0, 17.0, 12.0, 12.0, 21.0, 17.0, 25.0, 21.0, 23.0, 30.0, 25.0, 49.0, 55.0, 45.0, 52.0, 43.0, 37.0, 46.0, 50.0, 52.0, 39.0, 46.0, 37.0, 32.0, 36.0, 29.0, 29.0, 25.0, 13.0, 13.0, 8.0, 8.0, 8.0, 8.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0219712257385254, -1.9532334804534912, -1.8844958543777466, -1.8157581090927124, -1.7470204830169678, -1.6782827377319336, -1.6095449924468994, -1.5408072471618652, -1.4720696210861206, -1.4033318758010864, -1.3345942497253418, -1.2658565044403076, -1.1971187591552734, -1.1283811330795288, -1.0596433877944946, -0.9909057021141052, -0.9221680164337158, -0.8534303307533264, -0.784692645072937, -0.7159548997879028, -0.6472172141075134, -0.578479528427124, -0.5097417831420898, -0.44100409746170044, -0.37226641178131104, -0.30352872610092163, -0.23479101061820984, -0.16605331003665924, -0.09731560945510864, -0.02857792377471924, 0.040159791707992554, 0.10889750719070435, 0.17763495445251465, 0.24637265503406525, 0.31511035561561584, 0.38384807109832764, 0.45258575677871704, 0.5213234424591064, 0.5900611877441406, 0.65879887342453, 0.7275365591049194, 0.7962742447853088, 0.8650119304656982, 0.9337496757507324, 1.0024874210357666, 1.0712250471115112, 1.1399627923965454, 1.20870041847229, 1.2774381637573242, 1.3461759090423584, 1.414913535118103, 1.4836512804031372, 1.5523889064788818, 1.621126651763916, 1.6898643970489502, 1.7586021423339844, 1.827339768409729, 1.8960775136947632, 1.9648151397705078, 2.033552885055542, 2.102290630340576, 2.1710281372070312, 2.2397658824920654, 2.3085036277770996, 2.377241373062134]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 12.0, 14.0, 32.0, 41.0, 66.0, 111.0, 190.0, 331.0, 701.0, 1812.0, 6256.0, 33787.0, 248185.0, 598606.0, 132926.0, 18843.0, 4152.0, 1288.0, 530.0, 272.0, 134.0, 100.0, 53.0, 33.0, 28.0, 20.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8342361450195312, -0.8037261962890625, -0.7732162475585938, -0.742706298828125, -0.7121963500976562, -0.6816864013671875, -0.6511764526367188, -0.62066650390625, -0.5901565551757812, -0.5596466064453125, -0.5291366577148438, -0.498626708984375, -0.46811676025390625, -0.4376068115234375, -0.40709686279296875, -0.3765869140625, -0.34607696533203125, -0.3155670166015625, -0.28505706787109375, -0.254547119140625, -0.22403717041015625, -0.1935272216796875, -0.16301727294921875, -0.13250732421875, -0.10199737548828125, -0.0714874267578125, -0.04097747802734375, -0.010467529296875, 0.02004241943359375, 0.0505523681640625, 0.08106231689453125, 0.111572265625, 0.14208221435546875, 0.1725921630859375, 0.20310211181640625, 0.233612060546875, 0.26412200927734375, 0.2946319580078125, 0.32514190673828125, 0.35565185546875, 0.38616180419921875, 0.4166717529296875, 0.44718170166015625, 0.477691650390625, 0.5082015991210938, 0.5387115478515625, 0.5692214965820312, 0.5997314453125, 0.6302413940429688, 0.6607513427734375, 0.6912612915039062, 0.721771240234375, 0.7522811889648438, 0.7827911376953125, 0.8133010864257812, 0.84381103515625, 0.8743209838867188, 0.9048309326171875, 0.9353408813476562, 0.965850830078125, 0.9963607788085938, 1.0268707275390625, 1.0573806762695312, 1.087890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 18.0, 27.0, 21.0, 32.0, 45.0, 45.0, 64.0, 79.0, 70.0, 80.0, 86.0, 65.0, 60.0, 61.0, 70.0, 46.0, 28.0, 21.0, 17.0, 14.0, 15.0, 7.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1328125, -3.054229736328125, -2.97564697265625, -2.897064208984375, -2.8184814453125, -2.739898681640625, -2.66131591796875, -2.582733154296875, -2.504150390625, -2.425567626953125, -2.34698486328125, -2.268402099609375, -2.1898193359375, -2.111236572265625, -2.03265380859375, -1.954071044921875, -1.87548828125, -1.796905517578125, -1.71832275390625, -1.639739990234375, -1.5611572265625, -1.482574462890625, -1.40399169921875, -1.325408935546875, -1.246826171875, -1.168243408203125, -1.08966064453125, -1.011077880859375, -0.9324951171875, -0.853912353515625, -0.77532958984375, -0.696746826171875, -0.6181640625, -0.539581298828125, -0.46099853515625, -0.382415771484375, -0.3038330078125, -0.225250244140625, -0.14666748046875, -0.068084716796875, 0.010498046875, 0.089080810546875, 0.16766357421875, 0.246246337890625, 0.3248291015625, 0.403411865234375, 0.48199462890625, 0.560577392578125, 0.63916015625, 0.717742919921875, 0.79632568359375, 0.874908447265625, 0.9534912109375, 1.032073974609375, 1.11065673828125, 1.189239501953125, 1.267822265625, 1.346405029296875, 1.42498779296875, 1.503570556640625, 1.5821533203125, 1.660736083984375, 1.73931884765625, 1.817901611328125, 1.896484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 10.0, 13.0, 21.0, 39.0, 33.0, 56.0, 95.0, 118.0, 173.0, 256.0, 357.0, 565.0, 843.0, 1262.0, 1876.0, 2722.0, 4250.0, 6307.0, 9607.0, 14447.0, 21771.0, 32311.0, 48222.0, 70842.0, 99730.0, 128798.0, 144234.0, 132018.0, 101849.0, 73226.0, 50424.0, 33735.0, 22576.0, 15534.0, 9932.0, 6742.0, 4385.0, 2963.0, 2028.0, 1306.0, 942.0, 624.0, 412.0, 291.0, 192.0, 141.0, 83.0, 60.0, 43.0, 33.0, 26.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.1531982421875, -0.1483440399169922, -0.14348983764648438, -0.13863563537597656, -0.13378143310546875, -0.12892723083496094, -0.12407302856445312, -0.11921882629394531, -0.1143646240234375, -0.10951042175292969, -0.10465621948242188, -0.09980201721191406, -0.09494781494140625, -0.09009361267089844, -0.08523941040039062, -0.08038520812988281, -0.075531005859375, -0.07067680358886719, -0.06582260131835938, -0.06096839904785156, -0.05611419677734375, -0.05125999450683594, -0.046405792236328125, -0.04155158996582031, -0.0366973876953125, -0.03184318542480469, -0.026988983154296875, -0.022134780883789062, -0.01728057861328125, -0.012426376342773438, -0.007572174072265625, -0.0027179718017578125, 0.00213623046875, 0.0069904327392578125, 0.011844635009765625, 0.016698837280273438, 0.02155303955078125, 0.026407241821289062, 0.031261444091796875, 0.03611564636230469, 0.0409698486328125, 0.04582405090332031, 0.050678253173828125, 0.05553245544433594, 0.06038665771484375, 0.06524085998535156, 0.07009506225585938, 0.07494926452636719, 0.079803466796875, 0.08465766906738281, 0.08951187133789062, 0.09436607360839844, 0.09922027587890625, 0.10407447814941406, 0.10892868041992188, 0.11378288269042969, 0.1186370849609375, 0.12349128723144531, 0.12834548950195312, 0.13319969177246094, 0.13805389404296875, 0.14290809631347656, 0.14776229858398438, 0.1526165008544922, 0.157470703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 8.0, 5.0, 15.0, 13.0, 12.0, 10.0, 21.0, 16.0, 18.0, 24.0, 31.0, 20.0, 40.0, 29.0, 37.0, 54.0, 41.0, 39.0, 47.0, 47.0, 38.0, 34.0, 35.0, 35.0, 33.0, 25.0, 26.0, 11.0, 25.0, 20.0, 16.0, 16.0, 18.0, 13.0, 19.0, 17.0, 13.0, 11.0, 9.0, 8.0, 11.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.3671875, -2.287353515625, -2.20751953125, -2.127685546875, -2.0478515625, -1.968017578125, -1.88818359375, -1.808349609375, -1.728515625, -1.648681640625, -1.56884765625, -1.489013671875, -1.4091796875, -1.329345703125, -1.24951171875, -1.169677734375, -1.08984375, -1.010009765625, -0.93017578125, -0.850341796875, -0.7705078125, -0.690673828125, -0.61083984375, -0.531005859375, -0.451171875, -0.371337890625, -0.29150390625, -0.211669921875, -0.1318359375, -0.052001953125, 0.02783203125, 0.107666015625, 0.1875, 0.267333984375, 0.34716796875, 0.427001953125, 0.5068359375, 0.586669921875, 0.66650390625, 0.746337890625, 0.826171875, 0.906005859375, 0.98583984375, 1.065673828125, 1.1455078125, 1.225341796875, 1.30517578125, 1.385009765625, 1.46484375, 1.544677734375, 1.62451171875, 1.704345703125, 1.7841796875, 1.864013671875, 1.94384765625, 2.023681640625, 2.103515625, 2.183349609375, 2.26318359375, 2.343017578125, 2.4228515625, 2.502685546875, 2.58251953125, 2.662353515625, 2.7421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 11.0, 17.0, 36.0, 41.0, 65.0, 135.0, 178.0, 361.0, 689.0, 1374.0, 3412.0, 10210.0, 37271.0, 154807.0, 441495.0, 293977.0, 75518.0, 19023.0, 5751.0, 2131.0, 899.0, 500.0, 256.0, 157.0, 91.0, 61.0, 24.0, 25.0, 14.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053985595703125, -0.052170753479003906, -0.05035591125488281, -0.04854106903076172, -0.046726226806640625, -0.04491138458251953, -0.04309654235839844, -0.041281700134277344, -0.03946685791015625, -0.037652015686035156, -0.03583717346191406, -0.03402233123779297, -0.032207489013671875, -0.03039264678955078, -0.028577804565429688, -0.026762962341308594, -0.0249481201171875, -0.023133277893066406, -0.021318435668945312, -0.01950359344482422, -0.017688751220703125, -0.01587390899658203, -0.014059066772460938, -0.012244224548339844, -0.01042938232421875, -0.008614540100097656, -0.0067996978759765625, -0.004984855651855469, -0.003170013427734375, -0.0013551712036132812, 0.0004596710205078125, 0.0022745132446289062, 0.00408935546875, 0.005904197692871094, 0.0077190399169921875, 0.009533882141113281, 0.011348724365234375, 0.013163566589355469, 0.014978408813476562, 0.016793251037597656, 0.01860809326171875, 0.020422935485839844, 0.022237777709960938, 0.02405261993408203, 0.025867462158203125, 0.02768230438232422, 0.029497146606445312, 0.031311988830566406, 0.0331268310546875, 0.034941673278808594, 0.03675651550292969, 0.03857135772705078, 0.040386199951171875, 0.04220104217529297, 0.04401588439941406, 0.045830726623535156, 0.04764556884765625, 0.049460411071777344, 0.05127525329589844, 0.05309009552001953, 0.054904937744140625, 0.05671977996826172, 0.05853462219238281, 0.060349464416503906, 0.062164306640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 12.0, 14.0, 19.0, 28.0, 37.0, 42.0, 53.0, 82.0, 84.0, 112.0, 82.0, 91.0, 84.0, 74.0, 52.0, 39.0, 24.0, 15.0, 12.0, 13.0, 11.0, 2.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11732292175293e-05, -2.988334745168686e-05, -2.859346568584442e-05, -2.7303583920001984e-05, -2.6013702154159546e-05, -2.4723820388317108e-05, -2.343393862247467e-05, -2.2144056856632233e-05, -2.0854175090789795e-05, -1.9564293324947357e-05, -1.827441155910492e-05, -1.698452979326248e-05, -1.5694648027420044e-05, -1.4404766261577606e-05, -1.3114884495735168e-05, -1.182500272989273e-05, -1.0535120964050293e-05, -9.245239198207855e-06, -7.955357432365417e-06, -6.66547566652298e-06, -5.375593900680542e-06, -4.085712134838104e-06, -2.7958303689956665e-06, -1.5059486031532288e-06, -2.1606683731079102e-07, 1.0738149285316467e-06, 2.3636966943740845e-06, 3.6535784602165222e-06, 4.94346022605896e-06, 6.233341991901398e-06, 7.5232237577438354e-06, 8.813105523586273e-06, 1.0102987289428711e-05, 1.1392869055271149e-05, 1.2682750821113586e-05, 1.3972632586956024e-05, 1.5262514352798462e-05, 1.65523961186409e-05, 1.7842277884483337e-05, 1.9132159650325775e-05, 2.0422041416168213e-05, 2.171192318201065e-05, 2.300180494785309e-05, 2.4291686713695526e-05, 2.5581568479537964e-05, 2.68714502453804e-05, 2.816133201122284e-05, 2.9451213777065277e-05, 3.0741095542907715e-05, 3.203097730875015e-05, 3.332085907459259e-05, 3.461074084043503e-05, 3.5900622606277466e-05, 3.7190504372119904e-05, 3.848038613796234e-05, 3.977026790380478e-05, 4.106014966964722e-05, 4.2350031435489655e-05, 4.363991320133209e-05, 4.492979496717453e-05, 4.621967673301697e-05, 4.7509558498859406e-05, 4.879944026470184e-05, 5.008932203054428e-05, 5.137920379638672e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 3.0, 15.0, 15.0, 21.0, 22.0, 33.0, 40.0, 67.0, 127.0, 174.0, 297.0, 609.0, 1213.0, 2811.0, 7912.0, 26809.0, 107771.0, 383912.0, 374547.0, 103296.0, 25736.0, 7666.0, 2903.0, 1157.0, 614.0, 307.0, 157.0, 100.0, 58.0, 44.0, 28.0, 22.0, 18.0, 8.0, 9.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061126708984375, -0.05932807922363281, -0.057529449462890625, -0.05573081970214844, -0.05393218994140625, -0.05213356018066406, -0.050334930419921875, -0.04853630065917969, -0.0467376708984375, -0.04493904113769531, -0.043140411376953125, -0.04134178161621094, -0.03954315185546875, -0.03774452209472656, -0.035945892333984375, -0.03414726257324219, -0.0323486328125, -0.030550003051757812, -0.028751373291015625, -0.026952743530273438, -0.02515411376953125, -0.023355484008789062, -0.021556854248046875, -0.019758224487304688, -0.0179595947265625, -0.016160964965820312, -0.014362335205078125, -0.012563705444335938, -0.01076507568359375, -0.008966445922851562, -0.007167816162109375, -0.0053691864013671875, -0.003570556640625, -0.0017719268798828125, 2.6702880859375e-05, 0.0018253326416015625, 0.00362396240234375, 0.0054225921630859375, 0.007221221923828125, 0.009019851684570312, 0.0108184814453125, 0.012617111206054688, 0.014415740966796875, 0.016214370727539062, 0.01801300048828125, 0.019811630249023438, 0.021610260009765625, 0.023408889770507812, 0.02520751953125, 0.027006149291992188, 0.028804779052734375, 0.030603408813476562, 0.03240203857421875, 0.03420066833496094, 0.035999298095703125, 0.03779792785644531, 0.0395965576171875, 0.04139518737792969, 0.043193817138671875, 0.04499244689941406, 0.04679107666015625, 0.04858970642089844, 0.050388336181640625, 0.05218696594238281, 0.053985595703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 6.0, 10.0, 23.0, 13.0, 21.0, 25.0, 32.0, 38.0, 45.0, 39.0, 51.0, 51.0, 58.0, 56.0, 66.0, 53.0, 60.0, 55.0, 32.0, 52.0, 33.0, 29.0, 15.0, 25.0, 21.0, 13.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01247406005859375, -0.012079238891601562, -0.011684417724609375, -0.011289596557617188, -0.010894775390625, -0.010499954223632812, -0.010105133056640625, -0.009710311889648438, -0.00931549072265625, -0.008920669555664062, -0.008525848388671875, -0.008131027221679688, -0.0077362060546875, -0.0073413848876953125, -0.006946563720703125, -0.0065517425537109375, -0.00615692138671875, -0.0057621002197265625, -0.005367279052734375, -0.0049724578857421875, -0.00457763671875, -0.0041828155517578125, -0.003787994384765625, -0.0033931732177734375, -0.00299835205078125, -0.0026035308837890625, -0.002208709716796875, -0.0018138885498046875, -0.0014190673828125, -0.0010242462158203125, -0.000629425048828125, -0.0002346038818359375, 0.00016021728515625, 0.0005550384521484375, 0.000949859619140625, 0.0013446807861328125, 0.001739501953125, 0.0021343231201171875, 0.002529144287109375, 0.0029239654541015625, 0.00331878662109375, 0.0037136077880859375, 0.004108428955078125, 0.0045032501220703125, 0.0048980712890625, 0.0052928924560546875, 0.005687713623046875, 0.0060825347900390625, 0.00647735595703125, 0.0068721771240234375, 0.007266998291015625, 0.0076618194580078125, 0.008056640625, 0.008451461791992188, 0.008846282958984375, 0.009241104125976562, 0.00963592529296875, 0.010030746459960938, 0.010425567626953125, 0.010820388793945312, 0.0112152099609375, 0.011610031127929688, 0.012004852294921875, 0.012399673461914062, 0.01279449462890625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 18.0, 34.0, 62.0, 130.0, 143.0, 185.0, 162.0, 126.0, 73.0, 41.0, 12.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458585739135742, -3.3119616508483887, -3.1653378009796143, -3.0187137126922607, -2.8720898628234863, -2.725465774536133, -2.5788416862487793, -2.432217836380005, -2.2855939865112305, -2.138969898223877, -1.9923460483551025, -1.845721960067749, -1.6990981101989746, -1.552474021911621, -1.4058500528335571, -1.2592260837554932, -1.1126019954681396, -0.9659780263900757, -0.8193540573120117, -0.672730028629303, -0.526106059551239, -0.37948209047317505, -0.2328580617904663, -0.08623409271240234, 0.06038987636566162, 0.20701386034488678, 0.35363784432411194, 0.5002618432044983, 0.6468858122825623, 0.7935097813606262, 0.940133810043335, 1.086757779121399, 1.233381748199463, 1.3800057172775269, 1.5266296863555908, 1.6732537746429443, 1.8198776245117188, 1.9665017127990723, 2.113125801086426, 2.2597496509552, 2.4063735008239746, 2.552997589111328, 2.6996214389801025, 2.846245527267456, 2.9928693771362305, 3.139493465423584, 3.2861175537109375, 3.432741403579712, 3.5793654918670654, 3.725989580154419, 3.8726134300231934, 4.019237518310547, 4.1658616065979, 4.312485218048096, 4.459109306335449, 4.605733394622803, 4.752357482910156, 4.89898157119751, 5.045605659484863, 5.192229270935059, 5.338853359222412, 5.485477447509766, 5.632101535797119, 5.778725624084473, 5.925349235534668]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 27.0, 25.0, 31.0, 37.0, 46.0, 61.0, 91.0, 89.0, 71.0, 82.0, 88.0, 75.0, 64.0, 60.0, 45.0, 31.0, 18.0, 17.0, 9.0, 12.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.437211513519287, -3.353278160095215, -3.2693448066711426, -3.1854114532470703, -3.101478099822998, -3.017544746398926, -2.9336113929748535, -2.8496780395507812, -2.765744686126709, -2.6818113327026367, -2.5978779792785645, -2.513944625854492, -2.43001127243042, -2.3460779190063477, -2.2621445655822754, -2.178211212158203, -2.0942776203155518, -2.0103442668914795, -1.9264109134674072, -1.842477560043335, -1.7585442066192627, -1.6746108531951904, -1.5906773805618286, -1.5067440271377563, -1.422810673713684, -1.3388773202896118, -1.2549439668655396, -1.1710104942321777, -1.0870771408081055, -1.0031437873840332, -0.9192104339599609, -0.8352770805358887, -0.7513439655303955, -0.6674106121063232, -0.583477258682251, -0.49954384565353394, -0.41561049222946167, -0.3316771388053894, -0.24774372577667236, -0.1638103723526001, -0.07987701892852783, 0.0040563493967056274, 0.08798971772193909, 0.17192310094833374, 0.255856454372406, 0.33978980779647827, 0.4237232208251953, 0.5076565742492676, 0.5915899276733398, 0.6755232810974121, 0.7594566345214844, 0.8433900475502014, 0.9273234009742737, 1.0112566947937012, 1.095190167427063, 1.1791235208511353, 1.2630568742752075, 1.3469902276992798, 1.430923581123352, 1.5148570537567139, 1.5987904071807861, 1.6827237606048584, 1.7666571140289307, 1.850590467453003, 1.9345238208770752]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 7.0, 6.0, 5.0, 7.0, 4.0, 8.0, 16.0, 28.0, 27.0, 54.0, 86.0, 151.0, 257.0, 573.0, 1284.0, 3409.0, 10156.0, 34169.0, 143262.0, 628872.0, 170017.0, 38548.0, 11248.0, 3705.0, 1407.0, 549.0, 278.0, 152.0, 94.0, 44.0, 41.0, 30.0, 16.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.400390625, -2.31915283203125, -2.2379150390625, -2.15667724609375, -2.075439453125, -1.99420166015625, -1.9129638671875, -1.83172607421875, -1.75048828125, -1.66925048828125, -1.5880126953125, -1.50677490234375, -1.425537109375, -1.34429931640625, -1.2630615234375, -1.18182373046875, -1.1005859375, -1.01934814453125, -0.9381103515625, -0.85687255859375, -0.775634765625, -0.69439697265625, -0.6131591796875, -0.53192138671875, -0.45068359375, -0.36944580078125, -0.2882080078125, -0.20697021484375, -0.125732421875, -0.04449462890625, 0.0367431640625, 0.11798095703125, 0.19921875, 0.28045654296875, 0.3616943359375, 0.44293212890625, 0.524169921875, 0.60540771484375, 0.6866455078125, 0.76788330078125, 0.84912109375, 0.93035888671875, 1.0115966796875, 1.09283447265625, 1.174072265625, 1.25531005859375, 1.3365478515625, 1.41778564453125, 1.4990234375, 1.58026123046875, 1.6614990234375, 1.74273681640625, 1.823974609375, 1.90521240234375, 1.9864501953125, 2.06768798828125, 2.14892578125, 2.23016357421875, 2.3114013671875, 2.39263916015625, 2.473876953125, 2.55511474609375, 2.6363525390625, 2.71759033203125, 2.798828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 5.0, 2.0, 5.0, 11.0, 12.0, 18.0, 22.0, 21.0, 18.0, 26.0, 35.0, 27.0, 41.0, 37.0, 59.0, 45.0, 64.0, 48.0, 60.0, 57.0, 53.0, 50.0, 44.0, 35.0, 35.0, 42.0, 26.0, 24.0, 18.0, 10.0, 13.0, 9.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.697265625, -2.600738525390625, -2.50421142578125, -2.407684326171875, -2.3111572265625, -2.214630126953125, -2.11810302734375, -2.021575927734375, -1.925048828125, -1.828521728515625, -1.73199462890625, -1.635467529296875, -1.5389404296875, -1.442413330078125, -1.34588623046875, -1.249359130859375, -1.15283203125, -1.056304931640625, -0.95977783203125, -0.863250732421875, -0.7667236328125, -0.670196533203125, -0.57366943359375, -0.477142333984375, -0.380615234375, -0.284088134765625, -0.18756103515625, -0.091033935546875, 0.0054931640625, 0.102020263671875, 0.19854736328125, 0.295074462890625, 0.3916015625, 0.488128662109375, 0.58465576171875, 0.681182861328125, 0.7777099609375, 0.874237060546875, 0.97076416015625, 1.067291259765625, 1.163818359375, 1.260345458984375, 1.35687255859375, 1.453399658203125, 1.5499267578125, 1.646453857421875, 1.74298095703125, 1.839508056640625, 1.93603515625, 2.032562255859375, 2.12908935546875, 2.225616455078125, 2.3221435546875, 2.418670654296875, 2.51519775390625, 2.611724853515625, 2.708251953125, 2.804779052734375, 2.90130615234375, 2.997833251953125, 3.0943603515625, 3.190887451171875, 3.28741455078125, 3.383941650390625, 3.48046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 14.0, 16.0, 27.0, 24.0, 46.0, 60.0, 78.0, 147.0, 244.0, 475.0, 1553.0, 20636.0, 886914.0, 132380.0, 4402.0, 745.0, 291.0, 170.0, 106.0, 67.0, 46.0, 28.0, 26.0, 19.0, 11.0, 8.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.47857666015625, -5.2657470703125, -5.05291748046875, -4.840087890625, -4.62725830078125, -4.4144287109375, -4.20159912109375, -3.98876953125, -3.77593994140625, -3.5631103515625, -3.35028076171875, -3.137451171875, -2.92462158203125, -2.7117919921875, -2.49896240234375, -2.2861328125, -2.07330322265625, -1.8604736328125, -1.64764404296875, -1.434814453125, -1.22198486328125, -1.0091552734375, -0.79632568359375, -0.58349609375, -0.37066650390625, -0.1578369140625, 0.05499267578125, 0.267822265625, 0.48065185546875, 0.6934814453125, 0.90631103515625, 1.119140625, 1.33197021484375, 1.5447998046875, 1.75762939453125, 1.970458984375, 2.18328857421875, 2.3961181640625, 2.60894775390625, 2.82177734375, 3.03460693359375, 3.2474365234375, 3.46026611328125, 3.673095703125, 3.88592529296875, 4.0987548828125, 4.31158447265625, 4.5244140625, 4.73724365234375, 4.9500732421875, 5.16290283203125, 5.375732421875, 5.58856201171875, 5.8013916015625, 6.01422119140625, 6.22705078125, 6.43988037109375, 6.6527099609375, 6.86553955078125, 7.078369140625, 7.29119873046875, 7.5040283203125, 7.71685791015625, 7.9296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 10.0, 8.0, 13.0, 16.0, 19.0, 22.0, 29.0, 34.0, 36.0, 43.0, 53.0, 40.0, 58.0, 65.0, 64.0, 49.0, 64.0, 50.0, 44.0, 34.0, 47.0, 36.0, 29.0, 29.0, 25.0, 10.0, 17.0, 10.0, 18.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.5859375, -4.46826171875, -4.3505859375, -4.23291015625, -4.115234375, -3.99755859375, -3.8798828125, -3.76220703125, -3.64453125, -3.52685546875, -3.4091796875, -3.29150390625, -3.173828125, -3.05615234375, -2.9384765625, -2.82080078125, -2.703125, -2.58544921875, -2.4677734375, -2.35009765625, -2.232421875, -2.11474609375, -1.9970703125, -1.87939453125, -1.76171875, -1.64404296875, -1.5263671875, -1.40869140625, -1.291015625, -1.17333984375, -1.0556640625, -0.93798828125, -0.8203125, -0.70263671875, -0.5849609375, -0.46728515625, -0.349609375, -0.23193359375, -0.1142578125, 0.00341796875, 0.12109375, 0.23876953125, 0.3564453125, 0.47412109375, 0.591796875, 0.70947265625, 0.8271484375, 0.94482421875, 1.0625, 1.18017578125, 1.2978515625, 1.41552734375, 1.533203125, 1.65087890625, 1.7685546875, 1.88623046875, 2.00390625, 2.12158203125, 2.2392578125, 2.35693359375, 2.474609375, 2.59228515625, 2.7099609375, 2.82763671875, 2.9453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 18.0, 13.0, 33.0, 37.0, 69.0, 129.0, 294.0, 790.0, 3028.0, 37705.0, 901938.0, 97670.0, 5018.0, 1077.0, 341.0, 154.0, 82.0, 51.0, 27.0, 18.0, 17.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.70172119140625, -1.6378173828125, -1.57391357421875, -1.510009765625, -1.44610595703125, -1.3822021484375, -1.31829833984375, -1.25439453125, -1.19049072265625, -1.1265869140625, -1.06268310546875, -0.998779296875, -0.93487548828125, -0.8709716796875, -0.80706787109375, -0.7431640625, -0.67926025390625, -0.6153564453125, -0.55145263671875, -0.487548828125, -0.42364501953125, -0.3597412109375, -0.29583740234375, -0.23193359375, -0.16802978515625, -0.1041259765625, -0.04022216796875, 0.023681640625, 0.08758544921875, 0.1514892578125, 0.21539306640625, 0.279296875, 0.34320068359375, 0.4071044921875, 0.47100830078125, 0.534912109375, 0.59881591796875, 0.6627197265625, 0.72662353515625, 0.79052734375, 0.85443115234375, 0.9183349609375, 0.98223876953125, 1.046142578125, 1.11004638671875, 1.1739501953125, 1.23785400390625, 1.3017578125, 1.36566162109375, 1.4295654296875, 1.49346923828125, 1.557373046875, 1.62127685546875, 1.6851806640625, 1.74908447265625, 1.81298828125, 1.87689208984375, 1.9407958984375, 2.00469970703125, 2.068603515625, 2.13250732421875, 2.1964111328125, 2.26031494140625, 2.32421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 12.0, 23.0, 44.0, 37.0, 73.0, 119.0, 199.0, 171.0, 95.0, 69.0, 30.0, 31.0, 21.0, 18.0, 15.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020563602447509766, -0.00019852258265018463, -0.0001914091408252716, -0.00018429569900035858, -0.00017718225717544556, -0.00017006881535053253, -0.0001629553735256195, -0.00015584193170070648, -0.00014872848987579346, -0.00014161504805088043, -0.0001345016062259674, -0.00012738816440105438, -0.00012027472257614136, -0.00011316128075122833, -0.00010604783892631531, -9.893439710140228e-05, -9.182095527648926e-05, -8.470751345157623e-05, -7.759407162666321e-05, -7.048062980175018e-05, -6.336718797683716e-05, -5.625374615192413e-05, -4.914030432701111e-05, -4.2026862502098083e-05, -3.491342067718506e-05, -2.7799978852272034e-05, -2.068653702735901e-05, -1.3573095202445984e-05, -6.459653377532959e-06, 6.537884473800659e-07, 7.76723027229309e-06, 1.4880672097206116e-05, 2.199411392211914e-05, 2.9107555747032166e-05, 3.622099757194519e-05, 4.3334439396858215e-05, 5.044788122177124e-05, 5.7561323046684265e-05, 6.467476487159729e-05, 7.178820669651031e-05, 7.890164852142334e-05, 8.601509034633636e-05, 9.312853217124939e-05, 0.00010024197399616241, 0.00010735541582107544, 0.00011446885764598846, 0.00012158229947090149, 0.00012869574129581451, 0.00013580918312072754, 0.00014292262494564056, 0.0001500360667705536, 0.00015714950859546661, 0.00016426295042037964, 0.00017137639224529266, 0.0001784898340702057, 0.0001856032758951187, 0.00019271671772003174, 0.00019983015954494476, 0.0002069436013698578, 0.0002140570431947708, 0.00022117048501968384, 0.00022828392684459686, 0.0002353973686695099, 0.0002425108104944229, 0.00024962425231933594]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 38.0, 35.0, 66.0, 138.0, 266.0, 560.0, 1428.0, 5026.0, 52187.0, 866079.0, 112071.0, 7546.0, 1830.0, 633.0, 305.0, 129.0, 85.0, 44.0, 22.0, 12.0, 7.0, 6.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7255859375, -1.6631011962890625, -1.600616455078125, -1.5381317138671875, -1.47564697265625, -1.4131622314453125, -1.350677490234375, -1.2881927490234375, -1.2257080078125, -1.1632232666015625, -1.100738525390625, -1.0382537841796875, -0.97576904296875, -0.9132843017578125, -0.850799560546875, -0.7883148193359375, -0.725830078125, -0.6633453369140625, -0.600860595703125, -0.5383758544921875, -0.47589111328125, -0.4134063720703125, -0.350921630859375, -0.2884368896484375, -0.2259521484375, -0.1634674072265625, -0.100982666015625, -0.0384979248046875, 0.02398681640625, 0.0864715576171875, 0.148956298828125, 0.2114410400390625, 0.27392578125, 0.3364105224609375, 0.398895263671875, 0.4613800048828125, 0.52386474609375, 0.5863494873046875, 0.648834228515625, 0.7113189697265625, 0.7738037109375, 0.8362884521484375, 0.898773193359375, 0.9612579345703125, 1.02374267578125, 1.0862274169921875, 1.148712158203125, 1.2111968994140625, 1.273681640625, 1.3361663818359375, 1.398651123046875, 1.4611358642578125, 1.52362060546875, 1.5861053466796875, 1.648590087890625, 1.7110748291015625, 1.7735595703125, 1.8360443115234375, 1.898529052734375, 1.9610137939453125, 2.02349853515625, 2.0859832763671875, 2.148468017578125, 2.2109527587890625, 2.2734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 11.0, 28.0, 32.0, 51.0, 90.0, 127.0, 249.0, 138.0, 104.0, 46.0, 37.0, 25.0, 22.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.9521484375, -0.9312896728515625, -0.910430908203125, -0.8895721435546875, -0.86871337890625, -0.8478546142578125, -0.826995849609375, -0.8061370849609375, -0.7852783203125, -0.7644195556640625, -0.743560791015625, -0.7227020263671875, -0.70184326171875, -0.6809844970703125, -0.660125732421875, -0.6392669677734375, -0.618408203125, -0.5975494384765625, -0.576690673828125, -0.5558319091796875, -0.53497314453125, -0.5141143798828125, -0.493255615234375, -0.4723968505859375, -0.4515380859375, -0.4306793212890625, -0.409820556640625, -0.3889617919921875, -0.36810302734375, -0.3472442626953125, -0.326385498046875, -0.3055267333984375, -0.28466796875, -0.2638092041015625, -0.242950439453125, -0.2220916748046875, -0.20123291015625, -0.1803741455078125, -0.159515380859375, -0.1386566162109375, -0.1177978515625, -0.0969390869140625, -0.076080322265625, -0.0552215576171875, -0.03436279296875, -0.0135040283203125, 0.007354736328125, 0.0282135009765625, 0.049072265625, 0.0699310302734375, 0.090789794921875, 0.1116485595703125, 0.13250732421875, 0.1533660888671875, 0.174224853515625, 0.1950836181640625, 0.2159423828125, 0.2368011474609375, 0.257659912109375, 0.2785186767578125, 0.29937744140625, 0.3202362060546875, 0.341094970703125, 0.3619537353515625, 0.3828125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 14.0, 90.0, 314.0, 399.0, 158.0, 30.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.453025817871094, -38.737335205078125, -38.021644592285156, -37.30595397949219, -36.59026336669922, -35.874576568603516, -35.15888595581055, -34.44319534301758, -33.72750473022461, -33.01181411743164, -32.29612350463867, -31.580434799194336, -30.864744186401367, -30.1490535736084, -29.433364868164062, -28.717674255371094, -28.001983642578125, -27.286293029785156, -26.570602416992188, -25.85491371154785, -25.139223098754883, -24.423532485961914, -23.707843780517578, -22.99215316772461, -22.27646255493164, -21.560771942138672, -20.845081329345703, -20.129392623901367, -19.4137020111084, -18.69801139831543, -17.982322692871094, -17.266632080078125, -16.550941467285156, -15.835250854492188, -15.119561195373535, -14.403871536254883, -13.688180923461914, -12.972490310668945, -12.256800651550293, -11.54111099243164, -10.825420379638672, -10.109729766845703, -9.39404010772705, -8.678350448608398, -7.96265983581543, -7.246969699859619, -6.531279563903809, -5.815589427947998, -5.0998992919921875, -4.384209156036377, -3.6685190200805664, -2.952828884124756, -2.2371387481689453, -1.5214486122131348, -0.8057584762573242, -0.09006834030151367, 0.6256217956542969, 1.3413119316101074, 2.057002067565918, 2.7726922035217285, 3.488382339477539, 4.20407247543335, 4.91976261138916, 5.635452747344971, 6.351142883300781]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 11.0, 12.0, 12.0, 14.0, 20.0, 20.0, 23.0, 29.0, 23.0, 32.0, 35.0, 40.0, 40.0, 42.0, 56.0, 45.0, 46.0, 47.0, 36.0, 41.0, 38.0, 31.0, 35.0, 40.0, 32.0, 20.0, 30.0, 27.0, 15.0, 15.0, 14.0, 10.0, 12.0, 6.0, 7.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.363114356994629, -5.211436748504639, -5.059759616851807, -4.908082008361816, -4.756404876708984, -4.604727268218994, -4.453050136566162, -4.301372528076172, -4.14969539642334, -3.9980180263519287, -3.8463406562805176, -3.6946632862091064, -3.5429859161376953, -3.391308307647705, -3.239630937576294, -3.087953567504883, -2.9362759590148926, -2.7845985889434814, -2.6329212188720703, -2.481243848800659, -2.329566478729248, -2.177888870239258, -2.0262115001678467, -1.8745341300964355, -1.7228567600250244, -1.5711793899536133, -1.4195020198822021, -1.2678245306015015, -1.1161471605300903, -0.9644697904586792, -0.8127923607826233, -0.6611149311065674, -0.509437084197998, -0.3577596843242645, -0.206082284450531, -0.054404884576797485, 0.09727251529693604, 0.24894988536834717, 0.4006273150444031, 0.552304744720459, 0.7039821147918701, 0.8556594848632812, 1.0073368549346924, 1.159014344215393, 1.3106917142868042, 1.4623690843582153, 1.614046573638916, 1.7657239437103271, 1.9174013137817383, 2.0690786838531494, 2.2207560539245605, 2.3724334239959717, 2.524110794067383, 2.675788402557373, 2.827465772628784, 2.9791431427001953, 3.1308205127716064, 3.2824978828430176, 3.4341752529144287, 3.58585262298584, 3.73753023147583, 3.889207363128662, 4.040884971618652, 4.192562103271484, 4.344239711761475]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 7.0, 14.0, 11.0, 17.0, 20.0, 22.0, 24.0, 36.0, 56.0, 73.0, 72.0, 101.0, 143.0, 210.0, 356.0, 660.0, 1420.0, 4138.0, 18343.0, 129601.0, 1509500.0, 2284506.0, 211069.0, 25473.0, 5054.0, 1455.0, 645.0, 324.0, 223.0, 147.0, 111.0, 81.0, 74.0, 55.0, 53.0, 31.0, 28.0, 19.0, 21.0, 17.0, 19.0, 9.0, 10.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.634765625, -3.524993896484375, -3.41522216796875, -3.305450439453125, -3.1956787109375, -3.085906982421875, -2.97613525390625, -2.866363525390625, -2.756591796875, -2.646820068359375, -2.53704833984375, -2.427276611328125, -2.3175048828125, -2.207733154296875, -2.09796142578125, -1.988189697265625, -1.87841796875, -1.768646240234375, -1.65887451171875, -1.549102783203125, -1.4393310546875, -1.329559326171875, -1.21978759765625, -1.110015869140625, -1.000244140625, -0.890472412109375, -0.78070068359375, -0.670928955078125, -0.5611572265625, -0.451385498046875, -0.34161376953125, -0.231842041015625, -0.1220703125, -0.012298583984375, 0.09747314453125, 0.207244873046875, 0.3170166015625, 0.426788330078125, 0.53656005859375, 0.646331787109375, 0.756103515625, 0.865875244140625, 0.97564697265625, 1.085418701171875, 1.1951904296875, 1.304962158203125, 1.41473388671875, 1.524505615234375, 1.63427734375, 1.744049072265625, 1.85382080078125, 1.963592529296875, 2.0733642578125, 2.183135986328125, 2.29290771484375, 2.402679443359375, 2.512451171875, 2.622222900390625, 2.73199462890625, 2.841766357421875, 2.9515380859375, 3.061309814453125, 3.17108154296875, 3.280853271484375, 3.390625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 23.0, 23.0, 21.0, 26.0, 22.0, 36.0, 46.0, 64.0, 54.0, 68.0, 52.0, 56.0, 61.0, 70.0, 56.0, 60.0, 39.0, 38.0, 30.0, 31.0, 21.0, 18.0, 11.0, 13.0, 9.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.3559722900390625, -1.292999267578125, -1.2300262451171875, -1.16705322265625, -1.1040802001953125, -1.041107177734375, -0.9781341552734375, -0.9151611328125, -0.8521881103515625, -0.789215087890625, -0.7262420654296875, -0.66326904296875, -0.6002960205078125, -0.537322998046875, -0.4743499755859375, -0.411376953125, -0.3484039306640625, -0.285430908203125, -0.2224578857421875, -0.15948486328125, -0.0965118408203125, -0.033538818359375, 0.0294342041015625, 0.0924072265625, 0.1553802490234375, 0.218353271484375, 0.2813262939453125, 0.34429931640625, 0.4072723388671875, 0.470245361328125, 0.5332183837890625, 0.59619140625, 0.6591644287109375, 0.722137451171875, 0.7851104736328125, 0.84808349609375, 0.9110565185546875, 0.974029541015625, 1.0370025634765625, 1.0999755859375, 1.1629486083984375, 1.225921630859375, 1.2888946533203125, 1.35186767578125, 1.4148406982421875, 1.477813720703125, 1.5407867431640625, 1.603759765625, 1.6667327880859375, 1.729705810546875, 1.7926788330078125, 1.85565185546875, 1.9186248779296875, 1.981597900390625, 2.0445709228515625, 2.1075439453125, 2.1705169677734375, 2.233489990234375, 2.2964630126953125, 2.35943603515625, 2.4224090576171875, 2.485382080078125, 2.5483551025390625, 2.611328125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 12.0, 26.0, 74.0, 178.0, 595.0, 3535.0, 180510.0, 3987668.0, 19509.0, 1584.0, 343.0, 114.0, 49.0, 29.0, 14.0, 9.0, 11.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.55352783203125, -5.2125244140625, -4.87152099609375, -4.530517578125, -4.18951416015625, -3.8485107421875, -3.50750732421875, -3.16650390625, -2.82550048828125, -2.4844970703125, -2.14349365234375, -1.802490234375, -1.46148681640625, -1.1204833984375, -0.77947998046875, -0.4384765625, -0.09747314453125, 0.2435302734375, 0.58453369140625, 0.925537109375, 1.26654052734375, 1.6075439453125, 1.94854736328125, 2.28955078125, 2.63055419921875, 2.9715576171875, 3.31256103515625, 3.653564453125, 3.99456787109375, 4.3355712890625, 4.67657470703125, 5.017578125, 5.35858154296875, 5.6995849609375, 6.04058837890625, 6.381591796875, 6.72259521484375, 7.0635986328125, 7.40460205078125, 7.74560546875, 8.08660888671875, 8.4276123046875, 8.76861572265625, 9.109619140625, 9.45062255859375, 9.7916259765625, 10.13262939453125, 10.4736328125, 10.81463623046875, 11.1556396484375, 11.49664306640625, 11.837646484375, 12.17864990234375, 12.5196533203125, 12.86065673828125, 13.20166015625, 13.54266357421875, 13.8836669921875, 14.22467041015625, 14.565673828125, 14.90667724609375, 15.2476806640625, 15.58868408203125, 15.9296875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 11.0, 23.0, 35.0, 47.0, 73.0, 115.0, 226.0, 355.0, 534.0, 745.0, 655.0, 480.0, 280.0, 192.0, 100.0, 64.0, 40.0, 29.0, 12.0, 12.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.7763671875, -1.7358932495117188, -1.6954193115234375, -1.6549453735351562, -1.614471435546875, -1.5739974975585938, -1.5335235595703125, -1.4930496215820312, -1.45257568359375, -1.4121017456054688, -1.3716278076171875, -1.3311538696289062, -1.290679931640625, -1.2502059936523438, -1.2097320556640625, -1.1692581176757812, -1.1287841796875, -1.0883102416992188, -1.0478363037109375, -1.0073623657226562, -0.966888427734375, -0.9264144897460938, -0.8859405517578125, -0.8454666137695312, -0.80499267578125, -0.7645187377929688, -0.7240447998046875, -0.6835708618164062, -0.643096923828125, -0.6026229858398438, -0.5621490478515625, -0.5216751098632812, -0.481201171875, -0.44072723388671875, -0.4002532958984375, -0.35977935791015625, -0.319305419921875, -0.27883148193359375, -0.2383575439453125, -0.19788360595703125, -0.15740966796875, -0.11693572998046875, -0.0764617919921875, -0.03598785400390625, 0.004486083984375, 0.04496002197265625, 0.0854339599609375, 0.12590789794921875, 0.1663818359375, 0.20685577392578125, 0.2473297119140625, 0.28780364990234375, 0.328277587890625, 0.36875152587890625, 0.4092254638671875, 0.44969940185546875, 0.49017333984375, 0.5306472778320312, 0.5711212158203125, 0.6115951538085938, 0.652069091796875, 0.6925430297851562, 0.7330169677734375, 0.7734909057617188, 0.81396484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 8.0, 14.0, 14.0, 29.0, 26.0, 36.0, 46.0, 49.0, 63.0, 91.0, 72.0, 75.0, 74.0, 76.0, 73.0, 58.0, 46.0, 42.0, 38.0, 24.0, 14.0, 11.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.992717981338501, -1.8936253786087036, -1.7945326566696167, -1.6954400539398193, -1.5963473320007324, -1.497254729270935, -1.3981621265411377, -1.2990694046020508, -1.1999768018722534, -1.100884199142456, -1.0017914772033691, -0.9026988744735718, -0.8036062121391296, -0.7045135498046875, -0.6054209470748901, -0.506328284740448, -0.40723562240600586, -0.3081429600715637, -0.20905032753944397, -0.10995769500732422, -0.01086503267288208, 0.08822762966156006, 0.18732023239135742, 0.28641289472579956, 0.3855055570602417, 0.48459821939468384, 0.583690881729126, 0.6827834844589233, 0.7818761467933655, 0.8809688091278076, 0.980061411857605, 1.0791540145874023, 1.1782464981079102, 1.2773391008377075, 1.3764318227767944, 1.4755244255065918, 1.5746171474456787, 1.673709750175476, 1.7728023529052734, 1.8718950748443604, 1.9709876775741577, 2.070080280303955, 2.169173002243042, 2.268265724182129, 2.3673582077026367, 2.4664509296417236, 2.5655436515808105, 2.6646361351013184, 2.7637288570404053, 2.862821578979492, 2.9619140625, 3.061006784439087, 3.160099506378174, 3.2591919898986816, 3.3582847118377686, 3.4573774337768555, 3.5564699172973633, 3.65556263923645, 3.754655122756958, 3.853747844696045, 3.952840566635132, 4.051933288574219, 4.151025772094727, 4.250118255615234, 4.3492112159729]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 5.0, 10.0, 5.0, 7.0, 14.0, 16.0, 15.0, 14.0, 12.0, 38.0, 22.0, 26.0, 32.0, 31.0, 38.0, 36.0, 48.0, 43.0, 37.0, 41.0, 36.0, 29.0, 44.0, 39.0, 35.0, 33.0, 30.0, 32.0, 22.0, 32.0, 29.0, 30.0, 14.0, 18.0, 13.0, 12.0, 5.0, 10.0, 12.0, 5.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.9949958324432373, -1.9377926588058472, -1.880589485168457, -1.823386311531067, -1.7661831378936768, -1.7089799642562866, -1.6517767906188965, -1.594573736190796, -1.5373704433441162, -1.480167269706726, -1.422964096069336, -1.3657609224319458, -1.3085577487945557, -1.2513545751571655, -1.1941514015197754, -1.1369483470916748, -1.0797451734542847, -1.0225419998168945, -0.9653388261795044, -0.9081356525421143, -0.8509324789047241, -0.793729305267334, -0.7365261912345886, -0.6793230175971985, -0.6221198439598083, -0.5649166703224182, -0.5077134966850281, -0.4505103528499603, -0.3933071792125702, -0.33610400557518005, -0.2789008617401123, -0.22169768810272217, -0.16449439525604248, -0.10729122906923294, -0.0500880628824234, 0.007115095853805542, 0.06431826949119568, 0.12152144312858582, 0.17872458696365356, 0.2359277606010437, 0.29313093423843384, 0.350334107875824, 0.4075372815132141, 0.46474042534828186, 0.5219435691833496, 0.5791467428207397, 0.6363499164581299, 0.69355309009552, 0.7507562637329102, 0.8079594373703003, 0.8651626110076904, 0.9223657846450806, 0.9795689582824707, 1.0367721319198608, 1.093975305557251, 1.1511783599853516, 1.2083816528320312, 1.2655848264694214, 1.3227880001068115, 1.3799911737442017, 1.4371943473815918, 1.494397521018982, 1.551600694656372, 1.6088037490844727, 1.6660069227218628]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 11.0, 4.0, 14.0, 11.0, 13.0, 29.0, 24.0, 35.0, 36.0, 77.0, 70.0, 129.0, 192.0, 319.0, 607.0, 1120.0, 2195.0, 5134.0, 13797.0, 42934.0, 145486.0, 385062.0, 305963.0, 98251.0, 29254.0, 9798.0, 3933.0, 1768.0, 921.0, 486.0, 278.0, 174.0, 103.0, 87.0, 59.0, 36.0, 40.0, 32.0, 16.0, 7.0, 16.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.455078125, -0.43982696533203125, -0.4245758056640625, -0.40932464599609375, -0.394073486328125, -0.37882232666015625, -0.3635711669921875, -0.34832000732421875, -0.33306884765625, -0.31781768798828125, -0.3025665283203125, -0.28731536865234375, -0.272064208984375, -0.25681304931640625, -0.2415618896484375, -0.22631072998046875, -0.2110595703125, -0.19580841064453125, -0.1805572509765625, -0.16530609130859375, -0.150054931640625, -0.13480377197265625, -0.1195526123046875, -0.10430145263671875, -0.08905029296875, -0.07379913330078125, -0.0585479736328125, -0.04329681396484375, -0.028045654296875, -0.01279449462890625, 0.0024566650390625, 0.01770782470703125, 0.032958984375, 0.04821014404296875, 0.0634613037109375, 0.07871246337890625, 0.093963623046875, 0.10921478271484375, 0.1244659423828125, 0.13971710205078125, 0.15496826171875, 0.17021942138671875, 0.1854705810546875, 0.20072174072265625, 0.215972900390625, 0.23122406005859375, 0.2464752197265625, 0.26172637939453125, 0.2769775390625, 0.29222869873046875, 0.3074798583984375, 0.32273101806640625, 0.337982177734375, 0.35323333740234375, 0.3684844970703125, 0.38373565673828125, 0.39898681640625, 0.41423797607421875, 0.4294891357421875, 0.44474029541015625, 0.459991455078125, 0.47524261474609375, 0.4904937744140625, 0.5057449340820312, 0.52099609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 6.0, 10.0, 9.0, 7.0, 15.0, 16.0, 16.0, 34.0, 22.0, 39.0, 33.0, 32.0, 37.0, 54.0, 44.0, 49.0, 38.0, 46.0, 37.0, 33.0, 52.0, 29.0, 35.0, 31.0, 31.0, 32.0, 25.0, 39.0, 23.0, 22.0, 17.0, 11.0, 9.0, 14.0, 5.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.126953125, -1.0890655517578125, -1.051177978515625, -1.0132904052734375, -0.97540283203125, -0.9375152587890625, -0.899627685546875, -0.8617401123046875, -0.8238525390625, -0.7859649658203125, -0.748077392578125, -0.7101898193359375, -0.67230224609375, -0.6344146728515625, -0.596527099609375, -0.5586395263671875, -0.520751953125, -0.4828643798828125, -0.444976806640625, -0.4070892333984375, -0.36920166015625, -0.3313140869140625, -0.293426513671875, -0.2555389404296875, -0.2176513671875, -0.1797637939453125, -0.141876220703125, -0.1039886474609375, -0.06610107421875, -0.0282135009765625, 0.009674072265625, 0.0475616455078125, 0.08544921875, 0.1233367919921875, 0.161224365234375, 0.1991119384765625, 0.23699951171875, 0.2748870849609375, 0.312774658203125, 0.3506622314453125, 0.3885498046875, 0.4264373779296875, 0.464324951171875, 0.5022125244140625, 0.54010009765625, 0.5779876708984375, 0.615875244140625, 0.6537628173828125, 0.691650390625, 0.7295379638671875, 0.767425537109375, 0.8053131103515625, 0.84320068359375, 0.8810882568359375, 0.918975830078125, 0.9568634033203125, 0.9947509765625, 1.0326385498046875, 1.070526123046875, 1.1084136962890625, 1.14630126953125, 1.1841888427734375, 1.222076416015625, 1.2599639892578125, 1.2978515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 12.0, 17.0, 22.0, 24.0, 40.0, 69.0, 91.0, 153.0, 198.0, 310.0, 418.0, 666.0, 903.0, 1412.0, 2198.0, 3203.0, 4916.0, 7397.0, 11938.0, 17835.0, 28728.0, 45209.0, 70343.0, 106419.0, 147263.0, 166984.0, 143113.0, 101776.0, 67288.0, 43036.0, 27014.0, 17325.0, 11049.0, 7060.0, 4712.0, 3196.0, 2075.0, 1355.0, 868.0, 632.0, 419.0, 273.0, 196.0, 133.0, 79.0, 60.0, 43.0, 26.0, 20.0, 18.0, 11.0, 6.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12618064880371094, -0.12174606323242188, -0.11731147766113281, -0.11287689208984375, -0.10844230651855469, -0.10400772094726562, -0.09957313537597656, -0.0951385498046875, -0.09070396423339844, -0.08626937866210938, -0.08183479309082031, -0.07740020751953125, -0.07296562194824219, -0.06853103637695312, -0.06409645080566406, -0.059661865234375, -0.05522727966308594, -0.050792694091796875, -0.04635810852050781, -0.04192352294921875, -0.03748893737792969, -0.033054351806640625, -0.028619766235351562, -0.0241851806640625, -0.019750595092773438, -0.015316009521484375, -0.010881423950195312, -0.00644683837890625, -0.0020122528076171875, 0.002422332763671875, 0.0068569183349609375, 0.01129150390625, 0.015726089477539062, 0.020160675048828125, 0.024595260620117188, 0.02902984619140625, 0.03346443176269531, 0.037899017333984375, 0.04233360290527344, 0.0467681884765625, 0.05120277404785156, 0.055637359619140625, 0.06007194519042969, 0.06450653076171875, 0.06894111633300781, 0.07337570190429688, 0.07781028747558594, 0.082244873046875, 0.08667945861816406, 0.09111404418945312, 0.09554862976074219, 0.09998321533203125, 0.10441780090332031, 0.10885238647460938, 0.11328697204589844, 0.1177215576171875, 0.12215614318847656, 0.12659072875976562, 0.1310253143310547, 0.13545989990234375, 0.1398944854736328, 0.14432907104492188, 0.14876365661621094, 0.1531982421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 11.0, 5.0, 5.0, 8.0, 11.0, 10.0, 9.0, 10.0, 12.0, 12.0, 23.0, 17.0, 31.0, 26.0, 43.0, 59.0, 43.0, 49.0, 47.0, 57.0, 47.0, 61.0, 47.0, 49.0, 49.0, 36.0, 32.0, 27.0, 25.0, 23.0, 21.0, 18.0, 20.0, 5.0, 12.0, 9.0, 6.0, 6.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.303955078125, -2.22314453125, -2.142333984375, -2.0615234375, -1.980712890625, -1.89990234375, -1.819091796875, -1.73828125, -1.657470703125, -1.57666015625, -1.495849609375, -1.4150390625, -1.334228515625, -1.25341796875, -1.172607421875, -1.091796875, -1.010986328125, -0.93017578125, -0.849365234375, -0.7685546875, -0.687744140625, -0.60693359375, -0.526123046875, -0.4453125, -0.364501953125, -0.28369140625, -0.202880859375, -0.1220703125, -0.041259765625, 0.03955078125, 0.120361328125, 0.201171875, 0.281982421875, 0.36279296875, 0.443603515625, 0.5244140625, 0.605224609375, 0.68603515625, 0.766845703125, 0.84765625, 0.928466796875, 1.00927734375, 1.090087890625, 1.1708984375, 1.251708984375, 1.33251953125, 1.413330078125, 1.494140625, 1.574951171875, 1.65576171875, 1.736572265625, 1.8173828125, 1.898193359375, 1.97900390625, 2.059814453125, 2.140625, 2.221435546875, 2.30224609375, 2.383056640625, 2.4638671875, 2.544677734375, 2.62548828125, 2.706298828125, 2.787109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 0.0, 4.0, 8.0, 7.0, 11.0, 7.0, 15.0, 25.0, 24.0, 37.0, 34.0, 62.0, 87.0, 111.0, 271.0, 471.0, 991.0, 2387.0, 6361.0, 22725.0, 101018.0, 421420.0, 376333.0, 86539.0, 19529.0, 5918.0, 2069.0, 938.0, 480.0, 222.0, 138.0, 91.0, 59.0, 40.0, 30.0, 19.0, 14.0, 17.0, 9.0, 5.0, 7.0, 8.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0611572265625, -0.05918121337890625, -0.0572052001953125, -0.05522918701171875, -0.053253173828125, -0.05127716064453125, -0.0493011474609375, -0.04732513427734375, -0.04534912109375, -0.04337310791015625, -0.0413970947265625, -0.03942108154296875, -0.037445068359375, -0.03546905517578125, -0.0334930419921875, -0.03151702880859375, -0.029541015625, -0.02756500244140625, -0.0255889892578125, -0.02361297607421875, -0.021636962890625, -0.01966094970703125, -0.0176849365234375, -0.01570892333984375, -0.01373291015625, -0.01175689697265625, -0.0097808837890625, -0.00780487060546875, -0.005828857421875, -0.00385284423828125, -0.0018768310546875, 9.918212890625e-05, 0.0020751953125, 0.00405120849609375, 0.0060272216796875, 0.00800323486328125, 0.009979248046875, 0.01195526123046875, 0.0139312744140625, 0.01590728759765625, 0.01788330078125, 0.01985931396484375, 0.0218353271484375, 0.02381134033203125, 0.025787353515625, 0.02776336669921875, 0.0297393798828125, 0.03171539306640625, 0.03369140625, 0.03566741943359375, 0.0376434326171875, 0.03961944580078125, 0.041595458984375, 0.04357147216796875, 0.0455474853515625, 0.04752349853515625, 0.04949951171875, 0.05147552490234375, 0.0534515380859375, 0.05542755126953125, 0.057403564453125, 0.05937957763671875, 0.0613555908203125, 0.06333160400390625, 0.0653076171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 7.0, 21.0, 18.0, 26.0, 31.0, 52.0, 64.0, 71.0, 141.0, 104.0, 132.0, 93.0, 61.0, 52.0, 31.0, 20.0, 26.0, 12.0, 10.0, 13.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.459785461425781e-05, -5.317572504281998e-05, -5.175359547138214e-05, -5.0331465899944305e-05, -4.890933632850647e-05, -4.7487206757068634e-05, -4.60650771856308e-05, -4.464294761419296e-05, -4.322081804275513e-05, -4.179868847131729e-05, -4.0376558899879456e-05, -3.895442932844162e-05, -3.7532299757003784e-05, -3.611017018556595e-05, -3.468804061412811e-05, -3.326591104269028e-05, -3.184378147125244e-05, -3.0421651899814606e-05, -2.899952232837677e-05, -2.7577392756938934e-05, -2.61552631855011e-05, -2.4733133614063263e-05, -2.3311004042625427e-05, -2.188887447118759e-05, -2.0466744899749756e-05, -1.904461532831192e-05, -1.7622485756874084e-05, -1.620035618543625e-05, -1.4778226613998413e-05, -1.3356097042560577e-05, -1.1933967471122742e-05, -1.0511837899684906e-05, -9.08970832824707e-06, -7.667578756809235e-06, -6.245449185371399e-06, -4.823319613933563e-06, -3.4011900424957275e-06, -1.979060471057892e-06, -5.569308996200562e-07, 8.651986718177795e-07, 2.2873282432556152e-06, 3.709457814693451e-06, 5.131587386131287e-06, 6.553716957569122e-06, 7.975846529006958e-06, 9.397976100444794e-06, 1.082010567188263e-05, 1.2242235243320465e-05, 1.36643648147583e-05, 1.5086494386196136e-05, 1.6508623957633972e-05, 1.7930753529071808e-05, 1.9352883100509644e-05, 2.077501267194748e-05, 2.2197142243385315e-05, 2.361927181482315e-05, 2.5041401386260986e-05, 2.6463530957698822e-05, 2.7885660529136658e-05, 2.9307790100574493e-05, 3.072991967201233e-05, 3.2152049243450165e-05, 3.3574178814888e-05, 3.4996308386325836e-05, 3.641843795776367e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 11.0, 11.0, 26.0, 32.0, 51.0, 79.0, 142.0, 253.0, 452.0, 912.0, 1998.0, 4996.0, 14232.0, 52652.0, 231600.0, 514506.0, 168309.0, 39279.0, 11492.0, 4039.0, 1721.0, 784.0, 422.0, 213.0, 120.0, 72.0, 50.0, 28.0, 19.0, 7.0, 13.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.075927734375, -0.0736541748046875, -0.071380615234375, -0.0691070556640625, -0.06683349609375, -0.0645599365234375, -0.062286376953125, -0.0600128173828125, -0.0577392578125, -0.0554656982421875, -0.053192138671875, -0.0509185791015625, -0.04864501953125, -0.0463714599609375, -0.044097900390625, -0.0418243408203125, -0.03955078125, -0.0372772216796875, -0.035003662109375, -0.0327301025390625, -0.03045654296875, -0.0281829833984375, -0.025909423828125, -0.0236358642578125, -0.0213623046875, -0.0190887451171875, -0.016815185546875, -0.0145416259765625, -0.01226806640625, -0.0099945068359375, -0.007720947265625, -0.0054473876953125, -0.003173828125, -0.0009002685546875, 0.001373291015625, 0.0036468505859375, 0.00592041015625, 0.0081939697265625, 0.010467529296875, 0.0127410888671875, 0.0150146484375, 0.0172882080078125, 0.019561767578125, 0.0218353271484375, 0.02410888671875, 0.0263824462890625, 0.028656005859375, 0.0309295654296875, 0.033203125, 0.0354766845703125, 0.037750244140625, 0.0400238037109375, 0.04229736328125, 0.0445709228515625, 0.046844482421875, 0.0491180419921875, 0.0513916015625, 0.0536651611328125, 0.055938720703125, 0.0582122802734375, 0.06048583984375, 0.0627593994140625, 0.065032958984375, 0.0673065185546875, 0.069580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 12.0, 14.0, 18.0, 20.0, 47.0, 35.0, 43.0, 53.0, 77.0, 100.0, 94.0, 93.0, 103.0, 66.0, 52.0, 43.0, 34.0, 19.0, 15.0, 3.0, 9.0, 13.0, 4.0, 1.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01702880859375, -0.01648569107055664, -0.01594257354736328, -0.015399456024169922, -0.014856338500976562, -0.014313220977783203, -0.013770103454589844, -0.013226985931396484, -0.012683868408203125, -0.012140750885009766, -0.011597633361816406, -0.011054515838623047, -0.010511398315429688, -0.009968280792236328, -0.009425163269042969, -0.00888204574584961, -0.00833892822265625, -0.007795810699462891, -0.007252693176269531, -0.006709575653076172, -0.0061664581298828125, -0.005623340606689453, -0.005080223083496094, -0.004537105560302734, -0.003993988037109375, -0.0034508705139160156, -0.0029077529907226562, -0.002364635467529297, -0.0018215179443359375, -0.0012784004211425781, -0.0007352828979492188, -0.00019216537475585938, 0.0003509521484375, 0.0008940696716308594, 0.0014371871948242188, 0.001980304718017578, 0.0025234222412109375, 0.003066539764404297, 0.0036096572875976562, 0.004152774810791016, 0.004695892333984375, 0.005239009857177734, 0.005782127380371094, 0.006325244903564453, 0.0068683624267578125, 0.007411479949951172, 0.007954597473144531, 0.00849771499633789, 0.00904083251953125, 0.00958395004272461, 0.010127067565917969, 0.010670185089111328, 0.011213302612304688, 0.011756420135498047, 0.012299537658691406, 0.012842655181884766, 0.013385772705078125, 0.013928890228271484, 0.014472007751464844, 0.015015125274658203, 0.015558242797851562, 0.016101360321044922, 0.01664447784423828, 0.01718759536743164, 0.017730712890625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 15.0, 17.0, 35.0, 40.0, 53.0, 69.0, 86.0, 100.0, 103.0, 80.0, 79.0, 81.0, 72.0, 47.0, 41.0, 25.0, 21.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.608171820640564, -1.5410289764404297, -1.4738860130310059, -1.406743049621582, -1.3396002054214478, -1.2724573612213135, -1.2053143978118896, -1.1381714344024658, -1.0710285902023315, -1.0038857460021973, -0.9367427825927734, -0.8695998787879944, -0.8024569749832153, -0.7353140711784363, -0.6681711673736572, -0.6010282635688782, -0.5338853597640991, -0.46674245595932007, -0.399599552154541, -0.33245664834976196, -0.2653137445449829, -0.19817084074020386, -0.1310279369354248, -0.06388503313064575, 0.0032578706741333008, 0.07040077447891235, 0.1375436782836914, 0.20468658208847046, 0.2718294858932495, 0.33897238969802856, 0.4061152935028076, 0.47325819730758667, 0.5404009819030762, 0.6075438857078552, 0.6746867895126343, 0.7418296933174133, 0.8089725971221924, 0.8761155009269714, 0.9432584047317505, 1.0104012489318848, 1.0775442123413086, 1.1446871757507324, 1.2118300199508667, 1.278972864151001, 1.3461158275604248, 1.4132587909698486, 1.480401635169983, 1.5475444793701172, 1.614687442779541, 1.6818304061889648, 1.7489732503890991, 1.8161160945892334, 1.8832590579986572, 1.950402021408081, 2.017544746398926, 2.0846877098083496, 2.1518306732177734, 2.2189736366271973, 2.286116600036621, 2.353259325027466, 2.4204022884368896, 2.4875452518463135, 2.554687976837158, 2.621830940246582, 2.688973903656006]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 4.0, 9.0, 7.0, 11.0, 22.0, 15.0, 17.0, 20.0, 31.0, 25.0, 36.0, 33.0, 47.0, 42.0, 53.0, 43.0, 43.0, 42.0, 35.0, 40.0, 47.0, 29.0, 42.0, 34.0, 35.0, 29.0, 30.0, 33.0, 20.0, 15.0, 18.0, 16.0, 5.0, 9.0, 12.0, 11.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0681788921356201, -1.0322232246398926, -0.9962676763534546, -0.9603120684623718, -0.9243564605712891, -0.8884008526802063, -0.8524452447891235, -0.8164896368980408, -0.780534029006958, -0.7445784211158752, -0.7086228132247925, -0.6726672053337097, -0.636711597442627, -0.6007559895515442, -0.5648003816604614, -0.5288447737693787, -0.4928891658782959, -0.45693355798721313, -0.42097795009613037, -0.3850223422050476, -0.34906673431396484, -0.3131111264228821, -0.2771555185317993, -0.24119991064071655, -0.2052443027496338, -0.16928869485855103, -0.13333308696746826, -0.0973774790763855, -0.061421871185302734, -0.02546626329421997, 0.010489344596862793, 0.04644495248794556, 0.08240056037902832, 0.11835616827011108, 0.15431177616119385, 0.1902673840522766, 0.22622299194335938, 0.26217859983444214, 0.2981342077255249, 0.33408981561660767, 0.37004542350769043, 0.4060010313987732, 0.44195663928985596, 0.4779122471809387, 0.5138678550720215, 0.5498234629631042, 0.585779070854187, 0.6217346787452698, 0.6576902866363525, 0.6936458945274353, 0.7296015024185181, 0.7655571103096008, 0.8015127182006836, 0.8374683260917664, 0.8734239339828491, 0.9093795418739319, 0.9453351497650146, 0.9812907576560974, 1.0172463655471802, 1.0532019138336182, 1.0891575813293457, 1.1251132488250732, 1.1610687971115112, 1.1970243453979492, 1.2329800128936768]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 8.0, 11.0, 21.0, 24.0, 27.0, 47.0, 69.0, 101.0, 134.0, 207.0, 400.0, 740.0, 1560.0, 3467.0, 8234.0, 21163.0, 56840.0, 153402.0, 360391.0, 275089.0, 102906.0, 38251.0, 14514.0, 5782.0, 2494.0, 1203.0, 578.0, 306.0, 188.0, 123.0, 87.0, 59.0, 34.0, 32.0, 19.0, 13.0, 7.0, 10.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.48370361328125, -1.4283447265625, -1.37298583984375, -1.317626953125, -1.26226806640625, -1.2069091796875, -1.15155029296875, -1.09619140625, -1.04083251953125, -0.9854736328125, -0.93011474609375, -0.874755859375, -0.81939697265625, -0.7640380859375, -0.70867919921875, -0.6533203125, -0.59796142578125, -0.5426025390625, -0.48724365234375, -0.431884765625, -0.37652587890625, -0.3211669921875, -0.26580810546875, -0.21044921875, -0.15509033203125, -0.0997314453125, -0.04437255859375, 0.010986328125, 0.06634521484375, 0.1217041015625, 0.17706298828125, 0.232421875, 0.28778076171875, 0.3431396484375, 0.39849853515625, 0.453857421875, 0.50921630859375, 0.5645751953125, 0.61993408203125, 0.67529296875, 0.73065185546875, 0.7860107421875, 0.84136962890625, 0.896728515625, 0.95208740234375, 1.0074462890625, 1.06280517578125, 1.1181640625, 1.17352294921875, 1.2288818359375, 1.28424072265625, 1.339599609375, 1.39495849609375, 1.4503173828125, 1.50567626953125, 1.56103515625, 1.61639404296875, 1.6717529296875, 1.72711181640625, 1.782470703125, 1.83782958984375, 1.8931884765625, 1.94854736328125, 2.00390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 10.0, 13.0, 10.0, 9.0, 19.0, 17.0, 19.0, 26.0, 35.0, 41.0, 42.0, 52.0, 39.0, 53.0, 56.0, 57.0, 50.0, 42.0, 51.0, 42.0, 42.0, 35.0, 41.0, 25.0, 24.0, 26.0, 23.0, 15.0, 22.0, 7.0, 13.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19921875, -2.11737060546875, -2.0355224609375, -1.95367431640625, -1.871826171875, -1.78997802734375, -1.7081298828125, -1.62628173828125, -1.54443359375, -1.46258544921875, -1.3807373046875, -1.29888916015625, -1.217041015625, -1.13519287109375, -1.0533447265625, -0.97149658203125, -0.8896484375, -0.80780029296875, -0.7259521484375, -0.64410400390625, -0.562255859375, -0.48040771484375, -0.3985595703125, -0.31671142578125, -0.23486328125, -0.15301513671875, -0.0711669921875, 0.01068115234375, 0.092529296875, 0.17437744140625, 0.2562255859375, 0.33807373046875, 0.419921875, 0.50177001953125, 0.5836181640625, 0.66546630859375, 0.747314453125, 0.82916259765625, 0.9110107421875, 0.99285888671875, 1.07470703125, 1.15655517578125, 1.2384033203125, 1.32025146484375, 1.402099609375, 1.48394775390625, 1.5657958984375, 1.64764404296875, 1.7294921875, 1.81134033203125, 1.8931884765625, 1.97503662109375, 2.056884765625, 2.13873291015625, 2.2205810546875, 2.30242919921875, 2.38427734375, 2.46612548828125, 2.5479736328125, 2.62982177734375, 2.711669921875, 2.79351806640625, 2.8753662109375, 2.95721435546875, 3.0390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 11.0, 12.0, 17.0, 23.0, 29.0, 34.0, 56.0, 91.0, 129.0, 169.0, 198.0, 350.0, 695.0, 2087.0, 9873.0, 65462.0, 448964.0, 443468.0, 63445.0, 9697.0, 1999.0, 663.0, 361.0, 225.0, 123.0, 85.0, 87.0, 50.0, 43.0, 23.0, 25.0, 15.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0], "bins": [-4.07421875, -3.9697265625, -3.865234375, -3.7607421875, -3.65625, -3.5517578125, -3.447265625, -3.3427734375, -3.23828125, -3.1337890625, -3.029296875, -2.9248046875, -2.8203125, -2.7158203125, -2.611328125, -2.5068359375, -2.40234375, -2.2978515625, -2.193359375, -2.0888671875, -1.984375, -1.8798828125, -1.775390625, -1.6708984375, -1.56640625, -1.4619140625, -1.357421875, -1.2529296875, -1.1484375, -1.0439453125, -0.939453125, -0.8349609375, -0.73046875, -0.6259765625, -0.521484375, -0.4169921875, -0.3125, -0.2080078125, -0.103515625, 0.0009765625, 0.10546875, 0.2099609375, 0.314453125, 0.4189453125, 0.5234375, 0.6279296875, 0.732421875, 0.8369140625, 0.94140625, 1.0458984375, 1.150390625, 1.2548828125, 1.359375, 1.4638671875, 1.568359375, 1.6728515625, 1.77734375, 1.8818359375, 1.986328125, 2.0908203125, 2.1953125, 2.2998046875, 2.404296875, 2.5087890625, 2.61328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 9.0, 7.0, 10.0, 7.0, 16.0, 17.0, 26.0, 24.0, 35.0, 36.0, 37.0, 50.0, 39.0, 62.0, 51.0, 51.0, 57.0, 56.0, 46.0, 44.0, 43.0, 54.0, 37.0, 37.0, 17.0, 24.0, 18.0, 26.0, 13.0, 9.0, 5.0, 5.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.392578125, -3.293212890625, -3.19384765625, -3.094482421875, -2.9951171875, -2.895751953125, -2.79638671875, -2.697021484375, -2.59765625, -2.498291015625, -2.39892578125, -2.299560546875, -2.2001953125, -2.100830078125, -2.00146484375, -1.902099609375, -1.802734375, -1.703369140625, -1.60400390625, -1.504638671875, -1.4052734375, -1.305908203125, -1.20654296875, -1.107177734375, -1.0078125, -0.908447265625, -0.80908203125, -0.709716796875, -0.6103515625, -0.510986328125, -0.41162109375, -0.312255859375, -0.212890625, -0.113525390625, -0.01416015625, 0.085205078125, 0.1845703125, 0.283935546875, 0.38330078125, 0.482666015625, 0.58203125, 0.681396484375, 0.78076171875, 0.880126953125, 0.9794921875, 1.078857421875, 1.17822265625, 1.277587890625, 1.376953125, 1.476318359375, 1.57568359375, 1.675048828125, 1.7744140625, 1.873779296875, 1.97314453125, 2.072509765625, 2.171875, 2.271240234375, 2.37060546875, 2.469970703125, 2.5693359375, 2.668701171875, 2.76806640625, 2.867431640625, 2.966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 13.0, 19.0, 35.0, 58.0, 99.0, 311.0, 852.0, 3574.0, 31221.0, 592956.0, 393722.0, 21472.0, 2972.0, 719.0, 263.0, 106.0, 56.0, 27.0, 15.0, 14.0, 8.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.548828125, -1.5003204345703125, -1.451812744140625, -1.4033050537109375, -1.35479736328125, -1.3062896728515625, -1.257781982421875, -1.2092742919921875, -1.1607666015625, -1.1122589111328125, -1.063751220703125, -1.0152435302734375, -0.96673583984375, -0.9182281494140625, -0.869720458984375, -0.8212127685546875, -0.772705078125, -0.7241973876953125, -0.675689697265625, -0.6271820068359375, -0.57867431640625, -0.5301666259765625, -0.481658935546875, -0.4331512451171875, -0.3846435546875, -0.3361358642578125, -0.287628173828125, -0.2391204833984375, -0.19061279296875, -0.1421051025390625, -0.093597412109375, -0.0450897216796875, 0.00341796875, 0.0519256591796875, 0.100433349609375, 0.1489410400390625, 0.19744873046875, 0.2459564208984375, 0.294464111328125, 0.3429718017578125, 0.3914794921875, 0.4399871826171875, 0.488494873046875, 0.5370025634765625, 0.58551025390625, 0.6340179443359375, 0.682525634765625, 0.7310333251953125, 0.779541015625, 0.8280487060546875, 0.876556396484375, 0.9250640869140625, 0.97357177734375, 1.0220794677734375, 1.070587158203125, 1.1190948486328125, 1.1676025390625, 1.2161102294921875, 1.264617919921875, 1.3131256103515625, 1.36163330078125, 1.4101409912109375, 1.458648681640625, 1.5071563720703125, 1.5556640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 23.0, 27.0, 55.0, 69.0, 108.0, 162.0, 191.0, 92.0, 71.0, 48.0, 42.0, 29.0, 18.0, 1.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002079010009765625, -0.00020099617540836334, -0.00019409134984016418, -0.00018718652427196503, -0.00018028169870376587, -0.0001733768731355667, -0.00016647204756736755, -0.0001595672219991684, -0.00015266239643096924, -0.00014575757086277008, -0.00013885274529457092, -0.00013194791972637177, -0.0001250430941581726, -0.00011813826858997345, -0.00011123344302177429, -0.00010432861745357513, -9.742379188537598e-05, -9.051896631717682e-05, -8.361414074897766e-05, -7.67093151807785e-05, -6.980448961257935e-05, -6.289966404438019e-05, -5.599483847618103e-05, -4.909001290798187e-05, -4.2185187339782715e-05, -3.528036177158356e-05, -2.83755362033844e-05, -2.1470710635185242e-05, -1.4565885066986084e-05, -7.661059498786926e-06, -7.562339305877686e-07, 6.148591637611389e-06, 1.3053417205810547e-05, 1.9958242774009705e-05, 2.6863068342208862e-05, 3.376789391040802e-05, 4.067271947860718e-05, 4.7577545046806335e-05, 5.448237061500549e-05, 6.138719618320465e-05, 6.829202175140381e-05, 7.519684731960297e-05, 8.210167288780212e-05, 8.900649845600128e-05, 9.591132402420044e-05, 0.0001028161495923996, 0.00010972097516059875, 0.00011662580072879791, 0.00012353062629699707, 0.00013043545186519623, 0.00013734027743339539, 0.00014424510300159454, 0.0001511499285697937, 0.00015805475413799286, 0.00016495957970619202, 0.00017186440527439117, 0.00017876923084259033, 0.0001856740564107895, 0.00019257888197898865, 0.0001994837075471878, 0.00020638853311538696, 0.00021329335868358612, 0.00022019818425178528, 0.00022710300981998444, 0.0002340078353881836]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 19.0, 21.0, 53.0, 84.0, 141.0, 290.0, 516.0, 941.0, 1891.0, 5567.0, 29787.0, 259554.0, 628404.0, 101826.0, 13133.0, 3387.0, 1349.0, 678.0, 354.0, 211.0, 126.0, 67.0, 46.0, 39.0, 13.0, 8.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2373046875, -1.19775390625, -1.158203125, -1.11865234375, -1.0791015625, -1.03955078125, -1.0, -0.96044921875, -0.9208984375, -0.88134765625, -0.841796875, -0.80224609375, -0.7626953125, -0.72314453125, -0.68359375, -0.64404296875, -0.6044921875, -0.56494140625, -0.525390625, -0.48583984375, -0.4462890625, -0.40673828125, -0.3671875, -0.32763671875, -0.2880859375, -0.24853515625, -0.208984375, -0.16943359375, -0.1298828125, -0.09033203125, -0.05078125, -0.01123046875, 0.0283203125, 0.06787109375, 0.107421875, 0.14697265625, 0.1865234375, 0.22607421875, 0.265625, 0.30517578125, 0.3447265625, 0.38427734375, 0.423828125, 0.46337890625, 0.5029296875, 0.54248046875, 0.58203125, 0.62158203125, 0.6611328125, 0.70068359375, 0.740234375, 0.77978515625, 0.8193359375, 0.85888671875, 0.8984375, 0.93798828125, 0.9775390625, 1.01708984375, 1.056640625, 1.09619140625, 1.1357421875, 1.17529296875, 1.21484375, 1.25439453125, 1.2939453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 9.0, 12.0, 10.0, 26.0, 21.0, 30.0, 55.0, 52.0, 58.0, 67.0, 117.0, 107.0, 94.0, 82.0, 68.0, 42.0, 35.0, 37.0, 23.0, 20.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4576530456542969, -0.44289398193359375, -0.4281349182128906, -0.4133758544921875, -0.3986167907714844, -0.38385772705078125, -0.3690986633300781, -0.354339599609375, -0.3395805358886719, -0.32482147216796875, -0.3100624084472656, -0.2953033447265625, -0.2805442810058594, -0.26578521728515625, -0.2510261535644531, -0.23626708984375, -0.22150802612304688, -0.20674896240234375, -0.19198989868164062, -0.1772308349609375, -0.16247177124023438, -0.14771270751953125, -0.13295364379882812, -0.118194580078125, -0.10343551635742188, -0.08867645263671875, -0.07391738891601562, -0.0591583251953125, -0.044399261474609375, -0.02964019775390625, -0.014881134033203125, -0.0001220703125, 0.014636993408203125, 0.02939605712890625, 0.044155120849609375, 0.0589141845703125, 0.07367324829101562, 0.08843231201171875, 0.10319137573242188, 0.117950439453125, 0.13270950317382812, 0.14746856689453125, 0.16222763061523438, 0.1769866943359375, 0.19174575805664062, 0.20650482177734375, 0.22126388549804688, 0.23602294921875, 0.2507820129394531, 0.26554107666015625, 0.2803001403808594, 0.2950592041015625, 0.3098182678222656, 0.32457733154296875, 0.3393363952636719, 0.354095458984375, 0.3688545227050781, 0.38361358642578125, 0.3983726501464844, 0.4131317138671875, 0.4278907775878906, 0.44264984130859375, 0.4574089050292969, 0.47216796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [32.0, 188.0, 444.0, 265.0, 77.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9749128818511963, -1.2551007270812988, -0.5352885723114014, 0.1845235824584961, 0.9043357372283936, 1.624147891998291, 2.3439600467681885, 3.063771963119507, 3.7835843563079834, 4.503396511077881, 5.223208427429199, 5.943020820617676, 6.662833213806152, 7.382645130157471, 8.102457046508789, 8.822269439697266, 9.542081832885742, 10.261894226074219, 10.981706619262695, 11.701518058776855, 12.421330451965332, 13.141142845153809, 13.860954284667969, 14.580766677856445, 15.300579071044922, 16.0203914642334, 16.740203857421875, 17.46001625061035, 18.179828643798828, 18.899639129638672, 19.61945152282715, 20.339263916015625, 21.05907440185547, 21.778886795043945, 22.498699188232422, 23.2185115814209, 23.938323974609375, 24.65813446044922, 25.377946853637695, 26.097759246826172, 26.81757164001465, 27.537384033203125, 28.2571964263916, 28.977008819580078, 29.696819305419922, 30.4166316986084, 31.136444091796875, 31.85625648498535, 32.57606887817383, 33.29587936401367, 34.01569366455078, 34.735504150390625, 35.455318450927734, 36.17512893676758, 36.89494323730469, 37.61475372314453, 38.334564208984375, 39.05437469482422, 39.77418899536133, 40.49399948120117, 41.21381378173828, 41.933624267578125, 42.653438568115234, 43.37324905395508, 44.09306335449219]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 17.0, 20.0, 14.0, 16.0, 23.0, 21.0, 28.0, 25.0, 34.0, 18.0, 33.0, 40.0, 46.0, 33.0, 43.0, 39.0, 45.0, 43.0, 27.0, 37.0, 34.0, 39.0, 43.0, 39.0, 29.0, 19.0, 22.0, 19.0, 22.0, 19.0, 12.0, 10.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0], "bins": [-4.561337471008301, -4.434465408325195, -4.307592868804932, -4.180720806121826, -4.053848743438721, -3.926976442337036, -3.8001041412353516, -3.673232078552246, -3.5463597774505615, -3.419487476348877, -3.2926154136657715, -3.165743112564087, -3.0388708114624023, -2.911998748779297, -2.7851264476776123, -2.6582541465759277, -2.5313820838928223, -2.4045097827911377, -2.2776377201080322, -2.1507654190063477, -2.023893356323242, -1.8970210552215576, -1.770148754119873, -1.643276572227478, -1.516404390335083, -1.389532208442688, -1.262660026550293, -1.1357877254486084, -1.0089155435562134, -0.8820433616638184, -0.7551711201667786, -0.6282988786697388, -0.501427173614502, -0.37455496191978455, -0.24768275022506714, -0.12081053853034973, 0.006061673164367676, 0.1329338550567627, 0.2598060965538025, 0.3866783380508423, 0.5135505199432373, 0.6404227018356323, 0.7672949433326721, 0.8941671848297119, 1.021039366722107, 1.147911548614502, 1.2747838497161865, 1.4016560316085815, 1.5285282135009766, 1.6554003953933716, 1.7822725772857666, 1.9091448783874512, 2.0360169410705566, 2.162889242172241, 2.289761543273926, 2.4166336059570312, 2.543505907058716, 2.6703782081604004, 2.797250270843506, 2.9241225719451904, 3.050994873046875, 3.1778669357299805, 3.304739236831665, 3.4316115379333496, 3.558483600616455]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 6.0, 5.0, 8.0, 4.0, 9.0, 9.0, 14.0, 12.0, 15.0, 14.0, 31.0, 39.0, 41.0, 41.0, 88.0, 162.0, 232.0, 444.0, 1052.0, 3105.0, 12324.0, 74043.0, 783381.0, 2741721.0, 512811.0, 51192.0, 8957.0, 2412.0, 974.0, 405.0, 228.0, 145.0, 80.0, 56.0, 50.0, 35.0, 25.0, 18.0, 13.0, 22.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0], "bins": [-3.546875, -3.44671630859375, -3.3465576171875, -3.24639892578125, -3.146240234375, -3.04608154296875, -2.9459228515625, -2.84576416015625, -2.74560546875, -2.64544677734375, -2.5452880859375, -2.44512939453125, -2.344970703125, -2.24481201171875, -2.1446533203125, -2.04449462890625, -1.9443359375, -1.84417724609375, -1.7440185546875, -1.64385986328125, -1.543701171875, -1.44354248046875, -1.3433837890625, -1.24322509765625, -1.14306640625, -1.04290771484375, -0.9427490234375, -0.84259033203125, -0.742431640625, -0.64227294921875, -0.5421142578125, -0.44195556640625, -0.341796875, -0.24163818359375, -0.1414794921875, -0.04132080078125, 0.058837890625, 0.15899658203125, 0.2591552734375, 0.35931396484375, 0.45947265625, 0.55963134765625, 0.6597900390625, 0.75994873046875, 0.860107421875, 0.96026611328125, 1.0604248046875, 1.16058349609375, 1.2607421875, 1.36090087890625, 1.4610595703125, 1.56121826171875, 1.661376953125, 1.76153564453125, 1.8616943359375, 1.96185302734375, 2.06201171875, 2.16217041015625, 2.2623291015625, 2.36248779296875, 2.462646484375, 2.56280517578125, 2.6629638671875, 2.76312255859375, 2.86328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 5.0, 11.0, 9.0, 9.0, 18.0, 16.0, 26.0, 17.0, 23.0, 36.0, 47.0, 42.0, 43.0, 46.0, 45.0, 43.0, 43.0, 58.0, 44.0, 40.0, 39.0, 51.0, 32.0, 43.0, 30.0, 36.0, 19.0, 24.0, 17.0, 12.0, 17.0, 11.0, 11.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3291015625, -1.28369140625, -1.23828125, -1.19287109375, -1.1474609375, -1.10205078125, -1.056640625, -1.01123046875, -0.9658203125, -0.92041015625, -0.875, -0.82958984375, -0.7841796875, -0.73876953125, -0.693359375, -0.64794921875, -0.6025390625, -0.55712890625, -0.51171875, -0.46630859375, -0.4208984375, -0.37548828125, -0.330078125, -0.28466796875, -0.2392578125, -0.19384765625, -0.1484375, -0.10302734375, -0.0576171875, -0.01220703125, 0.033203125, 0.07861328125, 0.1240234375, 0.16943359375, 0.21484375, 0.26025390625, 0.3056640625, 0.35107421875, 0.396484375, 0.44189453125, 0.4873046875, 0.53271484375, 0.578125, 0.62353515625, 0.6689453125, 0.71435546875, 0.759765625, 0.80517578125, 0.8505859375, 0.89599609375, 0.94140625, 0.98681640625, 1.0322265625, 1.07763671875, 1.123046875, 1.16845703125, 1.2138671875, 1.25927734375, 1.3046875, 1.35009765625, 1.3955078125, 1.44091796875, 1.486328125, 1.53173828125, 1.5771484375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 6.0, 25.0, 43.0, 79.0, 162.0, 439.0, 1020.0, 3832.0, 56127.0, 3874996.0, 248223.0, 6838.0, 1478.0, 577.0, 237.0, 81.0, 40.0, 19.0, 11.0, 7.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.8734130859375, -6.649169921875, -6.4249267578125, -6.20068359375, -5.9764404296875, -5.752197265625, -5.5279541015625, -5.3037109375, -5.0794677734375, -4.855224609375, -4.6309814453125, -4.40673828125, -4.1824951171875, -3.958251953125, -3.7340087890625, -3.509765625, -3.2855224609375, -3.061279296875, -2.8370361328125, -2.61279296875, -2.3885498046875, -2.164306640625, -1.9400634765625, -1.7158203125, -1.4915771484375, -1.267333984375, -1.0430908203125, -0.81884765625, -0.5946044921875, -0.370361328125, -0.1461181640625, 0.078125, 0.3023681640625, 0.526611328125, 0.7508544921875, 0.97509765625, 1.1993408203125, 1.423583984375, 1.6478271484375, 1.8720703125, 2.0963134765625, 2.320556640625, 2.5447998046875, 2.76904296875, 2.9932861328125, 3.217529296875, 3.4417724609375, 3.666015625, 3.8902587890625, 4.114501953125, 4.3387451171875, 4.56298828125, 4.7872314453125, 5.011474609375, 5.2357177734375, 5.4599609375, 5.6842041015625, 5.908447265625, 6.1326904296875, 6.35693359375, 6.5811767578125, 6.805419921875, 7.0296630859375, 7.25390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 4.0, 19.0, 16.0, 36.0, 54.0, 100.0, 131.0, 221.0, 363.0, 474.0, 660.0, 606.0, 484.0, 330.0, 194.0, 127.0, 98.0, 46.0, 29.0, 19.0, 18.0, 14.0, 8.0, 3.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.099029541015625, -1.06231689453125, -1.025604248046875, -0.9888916015625, -0.952178955078125, -0.91546630859375, -0.878753662109375, -0.842041015625, -0.805328369140625, -0.76861572265625, -0.731903076171875, -0.6951904296875, -0.658477783203125, -0.62176513671875, -0.585052490234375, -0.54833984375, -0.511627197265625, -0.47491455078125, -0.438201904296875, -0.4014892578125, -0.364776611328125, -0.32806396484375, -0.291351318359375, -0.254638671875, -0.217926025390625, -0.18121337890625, -0.144500732421875, -0.1077880859375, -0.071075439453125, -0.03436279296875, 0.002349853515625, 0.0390625, 0.075775146484375, 0.11248779296875, 0.149200439453125, 0.1859130859375, 0.222625732421875, 0.25933837890625, 0.296051025390625, 0.332763671875, 0.369476318359375, 0.40618896484375, 0.442901611328125, 0.4796142578125, 0.516326904296875, 0.55303955078125, 0.589752197265625, 0.62646484375, 0.663177490234375, 0.69989013671875, 0.736602783203125, 0.7733154296875, 0.810028076171875, 0.84674072265625, 0.883453369140625, 0.920166015625, 0.956878662109375, 0.99359130859375, 1.030303955078125, 1.0670166015625, 1.103729248046875, 1.14044189453125, 1.177154541015625, 1.2138671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 13.0, 14.0, 13.0, 17.0, 15.0, 29.0, 25.0, 35.0, 31.0, 45.0, 44.0, 45.0, 49.0, 55.0, 40.0, 46.0, 57.0, 49.0, 44.0, 45.0, 57.0, 43.0, 27.0, 32.0, 23.0, 25.0, 21.0, 14.0, 6.0, 11.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7463939189910889, -1.6785998344421387, -1.610805869102478, -1.5430117845535278, -1.4752177000045776, -1.407423734664917, -1.3396296501159668, -1.2718355655670166, -1.2040414810180664, -1.1362473964691162, -1.0684534311294556, -1.0006593465805054, -0.9328652620315552, -0.8650712370872498, -0.7972772121429443, -0.7294831275939941, -0.6616891622543335, -0.5938951373100281, -0.5261010527610779, -0.45830702781677246, -0.39051297307014465, -0.32271891832351685, -0.2549248933792114, -0.18713083863258362, -0.11933678388595581, -0.0515427365899086, 0.01625131070613861, 0.08404535055160522, 0.15183940529823303, 0.21963346004486084, 0.28742748498916626, 0.35522153973579407, 0.4230155944824219, 0.4908096492290497, 0.5586037039756775, 0.6263977289199829, 0.6941918134689331, 0.7619858384132385, 0.829779863357544, 0.8975739479064941, 0.9653679728507996, 1.033161997795105, 1.1009560823440552, 1.1687500476837158, 1.236544132232666, 1.3043382167816162, 1.3721323013305664, 1.439926266670227, 1.5077203512191772, 1.5755144357681274, 1.643308401107788, 1.7111024856567383, 1.7788965702056885, 1.8466906547546387, 1.9144846200942993, 1.9822787046432495, 2.05007266998291, 2.1178667545318604, 2.1856608390808105, 2.2534546852111816, 2.321248769760132, 2.389042854309082, 2.4568369388580322, 2.5246310234069824, 2.5924251079559326]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 2.0, 16.0, 4.0, 11.0, 13.0, 12.0, 18.0, 16.0, 19.0, 28.0, 29.0, 35.0, 40.0, 32.0, 42.0, 38.0, 53.0, 32.0, 51.0, 52.0, 41.0, 45.0, 39.0, 36.0, 30.0, 34.0, 29.0, 36.0, 26.0, 21.0, 24.0, 22.0, 11.0, 12.0, 7.0, 9.0, 9.0, 7.0, 3.0, 10.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8354744911193848, -1.7747690677642822, -1.7140636444091797, -1.6533582210540771, -1.5926527976989746, -1.531947374343872, -1.4712419509887695, -1.410536527633667, -1.3498311042785645, -1.289125680923462, -1.2284202575683594, -1.1677148342132568, -1.1070094108581543, -1.0463039875030518, -0.985598623752594, -0.9248932003974915, -0.8641878366470337, -0.8034824132919312, -0.7427769899368286, -0.6820715665817261, -0.6213661432266235, -0.560660719871521, -0.49995535612106323, -0.4392499327659607, -0.37854450941085815, -0.3178390860557556, -0.2571336627006531, -0.19642826914787292, -0.13572284579277039, -0.07501742243766785, -0.014312028884887695, 0.046393394470214844, 0.10709881782531738, 0.16780424118041992, 0.22850964963436127, 0.2892150580883026, 0.34992048144340515, 0.4106259047985077, 0.47133129835128784, 0.5320367217063904, 0.5927421450614929, 0.6534475684165955, 0.714152991771698, 0.7748583555221558, 0.8355637788772583, 0.8962692022323608, 0.9569746255874634, 1.017680048942566, 1.0783854722976685, 1.139090895652771, 1.1997963190078735, 1.260501742362976, 1.3212071657180786, 1.3819125890731812, 1.4426178932189941, 1.5033233165740967, 1.5640287399291992, 1.6247341632843018, 1.6854395866394043, 1.7461450099945068, 1.8068504333496094, 1.867555856704712, 1.9282612800598145, 1.988966703414917, 2.0496721267700195]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 8.0, 18.0, 12.0, 16.0, 31.0, 40.0, 40.0, 49.0, 80.0, 96.0, 116.0, 173.0, 258.0, 356.0, 671.0, 1532.0, 5076.0, 24704.0, 151521.0, 532366.0, 272644.0, 45690.0, 8434.0, 2223.0, 842.0, 445.0, 296.0, 200.0, 147.0, 96.0, 94.0, 66.0, 37.0, 46.0, 27.0, 18.0, 11.0, 16.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7099609375, -0.6875457763671875, -0.665130615234375, -0.6427154541015625, -0.62030029296875, -0.5978851318359375, -0.575469970703125, -0.5530548095703125, -0.5306396484375, -0.5082244873046875, -0.485809326171875, -0.4633941650390625, -0.44097900390625, -0.4185638427734375, -0.396148681640625, -0.3737335205078125, -0.351318359375, -0.3289031982421875, -0.306488037109375, -0.2840728759765625, -0.26165771484375, -0.2392425537109375, -0.216827392578125, -0.1944122314453125, -0.1719970703125, -0.1495819091796875, -0.127166748046875, -0.1047515869140625, -0.08233642578125, -0.0599212646484375, -0.037506103515625, -0.0150909423828125, 0.00732421875, 0.0297393798828125, 0.052154541015625, 0.0745697021484375, 0.09698486328125, 0.1194000244140625, 0.141815185546875, 0.1642303466796875, 0.1866455078125, 0.2090606689453125, 0.231475830078125, 0.2538909912109375, 0.27630615234375, 0.2987213134765625, 0.321136474609375, 0.3435516357421875, 0.365966796875, 0.3883819580078125, 0.410797119140625, 0.4332122802734375, 0.45562744140625, 0.4780426025390625, 0.500457763671875, 0.5228729248046875, 0.5452880859375, 0.5677032470703125, 0.590118408203125, 0.6125335693359375, 0.63494873046875, 0.6573638916015625, 0.679779052734375, 0.7021942138671875, 0.724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 10.0, 9.0, 8.0, 8.0, 8.0, 11.0, 18.0, 11.0, 24.0, 24.0, 28.0, 27.0, 33.0, 36.0, 33.0, 34.0, 39.0, 33.0, 51.0, 29.0, 40.0, 37.0, 43.0, 42.0, 37.0, 37.0, 28.0, 35.0, 27.0, 30.0, 22.0, 27.0, 15.0, 16.0, 17.0, 15.0, 5.0, 6.0, 10.0, 12.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.189453125, -1.1529083251953125, -1.116363525390625, -1.0798187255859375, -1.04327392578125, -1.0067291259765625, -0.970184326171875, -0.9336395263671875, -0.8970947265625, -0.8605499267578125, -0.824005126953125, -0.7874603271484375, -0.75091552734375, -0.7143707275390625, -0.677825927734375, -0.6412811279296875, -0.604736328125, -0.5681915283203125, -0.531646728515625, -0.4951019287109375, -0.45855712890625, -0.4220123291015625, -0.385467529296875, -0.3489227294921875, -0.3123779296875, -0.2758331298828125, -0.239288330078125, -0.2027435302734375, -0.16619873046875, -0.1296539306640625, -0.093109130859375, -0.0565643310546875, -0.02001953125, 0.0165252685546875, 0.053070068359375, 0.0896148681640625, 0.12615966796875, 0.1627044677734375, 0.199249267578125, 0.2357940673828125, 0.2723388671875, 0.3088836669921875, 0.345428466796875, 0.3819732666015625, 0.41851806640625, 0.4550628662109375, 0.491607666015625, 0.5281524658203125, 0.564697265625, 0.6012420654296875, 0.637786865234375, 0.6743316650390625, 0.71087646484375, 0.7474212646484375, 0.783966064453125, 0.8205108642578125, 0.8570556640625, 0.8936004638671875, 0.930145263671875, 0.9666900634765625, 1.00323486328125, 1.0397796630859375, 1.076324462890625, 1.1128692626953125, 1.1494140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 15.0, 16.0, 24.0, 30.0, 48.0, 74.0, 104.0, 160.0, 264.0, 417.0, 626.0, 924.0, 1522.0, 2458.0, 4009.0, 6354.0, 10138.0, 16767.0, 27884.0, 46265.0, 76014.0, 117751.0, 160462.0, 173274.0, 144591.0, 99211.0, 62356.0, 37745.0, 22874.0, 13783.0, 8311.0, 5141.0, 3243.0, 2059.0, 1314.0, 800.0, 555.0, 328.0, 201.0, 134.0, 104.0, 67.0, 38.0, 35.0, 16.0, 17.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1829833984375, -0.17713546752929688, -0.17128753662109375, -0.16543960571289062, -0.1595916748046875, -0.15374374389648438, -0.14789581298828125, -0.14204788208007812, -0.136199951171875, -0.13035202026367188, -0.12450408935546875, -0.11865615844726562, -0.1128082275390625, -0.10696029663085938, -0.10111236572265625, -0.09526443481445312, -0.08941650390625, -0.08356857299804688, -0.07772064208984375, -0.07187271118164062, -0.0660247802734375, -0.060176849365234375, -0.05432891845703125, -0.048480987548828125, -0.042633056640625, -0.036785125732421875, -0.03093719482421875, -0.025089263916015625, -0.0192413330078125, -0.013393402099609375, -0.00754547119140625, -0.001697540283203125, 0.004150390625, 0.009998321533203125, 0.01584625244140625, 0.021694183349609375, 0.0275421142578125, 0.033390045166015625, 0.03923797607421875, 0.045085906982421875, 0.050933837890625, 0.056781768798828125, 0.06262969970703125, 0.06847763061523438, 0.0743255615234375, 0.08017349243164062, 0.08602142333984375, 0.09186935424804688, 0.09771728515625, 0.10356521606445312, 0.10941314697265625, 0.11526107788085938, 0.1211090087890625, 0.12695693969726562, 0.13280487060546875, 0.13865280151367188, 0.144500732421875, 0.15034866333007812, 0.15619659423828125, 0.16204452514648438, 0.1678924560546875, 0.17374038696289062, 0.17958831787109375, 0.18543624877929688, 0.1912841796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 11.0, 9.0, 8.0, 9.0, 13.0, 16.0, 22.0, 30.0, 18.0, 34.0, 26.0, 32.0, 33.0, 44.0, 45.0, 49.0, 47.0, 54.0, 60.0, 42.0, 37.0, 48.0, 35.0, 36.0, 40.0, 25.0, 29.0, 16.0, 14.0, 12.0, 23.0, 17.0, 9.0, 6.0, 7.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.07421875, -2.975982666015625, -2.87774658203125, -2.779510498046875, -2.6812744140625, -2.583038330078125, -2.48480224609375, -2.386566162109375, -2.288330078125, -2.190093994140625, -2.09185791015625, -1.993621826171875, -1.8953857421875, -1.797149658203125, -1.69891357421875, -1.600677490234375, -1.50244140625, -1.404205322265625, -1.30596923828125, -1.207733154296875, -1.1094970703125, -1.011260986328125, -0.91302490234375, -0.814788818359375, -0.716552734375, -0.618316650390625, -0.52008056640625, -0.421844482421875, -0.3236083984375, -0.225372314453125, -0.12713623046875, -0.028900146484375, 0.0693359375, 0.167572021484375, 0.26580810546875, 0.364044189453125, 0.4622802734375, 0.560516357421875, 0.65875244140625, 0.756988525390625, 0.855224609375, 0.953460693359375, 1.05169677734375, 1.149932861328125, 1.2481689453125, 1.346405029296875, 1.44464111328125, 1.542877197265625, 1.64111328125, 1.739349365234375, 1.83758544921875, 1.935821533203125, 2.0340576171875, 2.132293701171875, 2.23052978515625, 2.328765869140625, 2.427001953125, 2.525238037109375, 2.62347412109375, 2.721710205078125, 2.8199462890625, 2.918182373046875, 3.01641845703125, 3.114654541015625, 3.212890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 9.0, 18.0, 23.0, 48.0, 84.0, 119.0, 172.0, 305.0, 497.0, 833.0, 1946.0, 6050.0, 38631.0, 401246.0, 527401.0, 58638.0, 7983.0, 2241.0, 949.0, 532.0, 290.0, 171.0, 131.0, 86.0, 48.0, 27.0, 16.0, 20.0, 9.0, 7.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107421875, -0.10345649719238281, -0.09949111938476562, -0.09552574157714844, -0.09156036376953125, -0.08759498596191406, -0.08362960815429688, -0.07966423034667969, -0.0756988525390625, -0.07173347473144531, -0.06776809692382812, -0.06380271911621094, -0.05983734130859375, -0.05587196350097656, -0.051906585693359375, -0.04794120788574219, -0.043975830078125, -0.04001045227050781, -0.036045074462890625, -0.03207969665527344, -0.02811431884765625, -0.024148941040039062, -0.020183563232421875, -0.016218185424804688, -0.0122528076171875, -0.008287429809570312, -0.004322052001953125, -0.0003566741943359375, 0.00360870361328125, 0.0075740814208984375, 0.011539459228515625, 0.015504837036132812, 0.01947021484375, 0.023435592651367188, 0.027400970458984375, 0.03136634826660156, 0.03533172607421875, 0.03929710388183594, 0.043262481689453125, 0.04722785949707031, 0.0511932373046875, 0.05515861511230469, 0.059123992919921875, 0.06308937072753906, 0.06705474853515625, 0.07102012634277344, 0.07498550415039062, 0.07895088195800781, 0.082916259765625, 0.08688163757324219, 0.09084701538085938, 0.09481239318847656, 0.09877777099609375, 0.10274314880371094, 0.10670852661132812, 0.11067390441894531, 0.1146392822265625, 0.11860466003417969, 0.12257003784179688, 0.12653541564941406, 0.13050079345703125, 0.13446617126464844, 0.13843154907226562, 0.1423969268798828, 0.1463623046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 27.0, 29.0, 71.0, 113.0, 146.0, 166.0, 146.0, 118.0, 76.0, 45.0, 23.0, 14.0, 10.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001043081283569336, -0.00010160915553569794, -9.891018271446228e-05, -9.621120989322662e-05, -9.351223707199097e-05, -9.081326425075531e-05, -8.811429142951965e-05, -8.5415318608284e-05, -8.271634578704834e-05, -8.001737296581268e-05, -7.731840014457703e-05, -7.461942732334137e-05, -7.192045450210571e-05, -6.922148168087006e-05, -6.65225088596344e-05, -6.382353603839874e-05, -6.112456321716309e-05, -5.842559039592743e-05, -5.572661757469177e-05, -5.3027644753456116e-05, -5.032867193222046e-05, -4.76296991109848e-05, -4.4930726289749146e-05, -4.223175346851349e-05, -3.953278064727783e-05, -3.6833807826042175e-05, -3.413483500480652e-05, -3.143586218357086e-05, -2.8736889362335205e-05, -2.603791654109955e-05, -2.333894371986389e-05, -2.0639970898628235e-05, -1.7940998077392578e-05, -1.5242025256156921e-05, -1.2543052434921265e-05, -9.844079613685608e-06, -7.145106792449951e-06, -4.4461339712142944e-06, -1.7471611499786377e-06, 9.51811671257019e-07, 3.6507844924926758e-06, 6.3497573137283325e-06, 9.04873013496399e-06, 1.1747702956199646e-05, 1.4446675777435303e-05, 1.714564859867096e-05, 1.9844621419906616e-05, 2.2543594241142273e-05, 2.524256706237793e-05, 2.7941539883613586e-05, 3.064051270484924e-05, 3.33394855260849e-05, 3.603845834732056e-05, 3.873743116855621e-05, 4.143640398979187e-05, 4.413537681102753e-05, 4.6834349632263184e-05, 4.953332245349884e-05, 5.22322952747345e-05, 5.4931268095970154e-05, 5.763024091720581e-05, 6.032921373844147e-05, 6.302818655967712e-05, 6.572715938091278e-05, 6.842613220214844e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 3.0, 24.0, 25.0, 46.0, 56.0, 105.0, 157.0, 300.0, 494.0, 960.0, 1662.0, 3381.0, 6816.0, 15008.0, 35784.0, 94088.0, 242555.0, 350005.0, 180454.0, 67730.0, 26313.0, 11214.0, 5330.0, 2578.0, 1394.0, 845.0, 457.0, 284.0, 162.0, 103.0, 76.0, 51.0, 27.0, 18.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07366943359375, -0.07152271270751953, -0.06937599182128906, -0.0672292709350586, -0.06508255004882812, -0.06293582916259766, -0.06078910827636719, -0.05864238739013672, -0.05649566650390625, -0.05434894561767578, -0.05220222473144531, -0.050055503845214844, -0.047908782958984375, -0.045762062072753906, -0.04361534118652344, -0.04146862030029297, -0.0393218994140625, -0.03717517852783203, -0.03502845764160156, -0.032881736755371094, -0.030735015869140625, -0.028588294982910156, -0.026441574096679688, -0.02429485321044922, -0.02214813232421875, -0.02000141143798828, -0.017854690551757812, -0.015707969665527344, -0.013561248779296875, -0.011414527893066406, -0.009267807006835938, -0.007121086120605469, -0.004974365234375, -0.0028276443481445312, -0.0006809234619140625, 0.0014657974243164062, 0.003612518310546875, 0.005759239196777344, 0.007905960083007812, 0.010052680969238281, 0.01219940185546875, 0.014346122741699219, 0.016492843627929688, 0.018639564514160156, 0.020786285400390625, 0.022933006286621094, 0.025079727172851562, 0.02722644805908203, 0.0293731689453125, 0.03151988983154297, 0.03366661071777344, 0.035813331604003906, 0.037960052490234375, 0.040106773376464844, 0.04225349426269531, 0.04440021514892578, 0.04654693603515625, 0.04869365692138672, 0.05084037780761719, 0.052987098693847656, 0.055133819580078125, 0.057280540466308594, 0.05942726135253906, 0.06157398223876953, 0.063720703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 11.0, 11.0, 19.0, 18.0, 21.0, 36.0, 45.0, 50.0, 67.0, 76.0, 106.0, 98.0, 86.0, 97.0, 65.0, 40.0, 24.0, 13.0, 23.0, 11.0, 10.0, 4.0, 11.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027587890625, -0.02662515640258789, -0.02566242218017578, -0.024699687957763672, -0.023736953735351562, -0.022774219512939453, -0.021811485290527344, -0.020848751068115234, -0.019886016845703125, -0.018923282623291016, -0.017960548400878906, -0.016997814178466797, -0.016035079956054688, -0.015072345733642578, -0.014109611511230469, -0.01314687728881836, -0.01218414306640625, -0.01122140884399414, -0.010258674621582031, -0.009295940399169922, -0.008333206176757812, -0.007370471954345703, -0.006407737731933594, -0.005445003509521484, -0.004482269287109375, -0.0035195350646972656, -0.0025568008422851562, -0.0015940666198730469, -0.0006313323974609375, 0.0003314018249511719, 0.0012941360473632812, 0.0022568702697753906, 0.0032196044921875, 0.004182338714599609, 0.005145072937011719, 0.006107807159423828, 0.0070705413818359375, 0.008033275604248047, 0.008996009826660156, 0.009958744049072266, 0.010921478271484375, 0.011884212493896484, 0.012846946716308594, 0.013809680938720703, 0.014772415161132812, 0.015735149383544922, 0.01669788360595703, 0.01766061782836914, 0.01862335205078125, 0.01958608627319336, 0.02054882049560547, 0.021511554718017578, 0.022474288940429688, 0.023437023162841797, 0.024399757385253906, 0.025362491607666016, 0.026325225830078125, 0.027287960052490234, 0.028250694274902344, 0.029213428497314453, 0.030176162719726562, 0.031138896942138672, 0.03210163116455078, 0.03306436538696289, 0.034027099609375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 14.0, 19.0, 20.0, 26.0, 40.0, 34.0, 51.0, 52.0, 48.0, 56.0, 55.0, 69.0, 56.0, 64.0, 65.0, 39.0, 48.0, 60.0, 48.0, 34.0, 27.0, 16.0, 14.0, 9.0, 15.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0538415908813477, -1.0038965940475464, -0.9539515972137451, -0.9040066003799438, -0.8540616035461426, -0.8041166067123413, -0.7541716694831848, -0.7042266726493835, -0.6542816758155823, -0.604336678981781, -0.5543916821479797, -0.5044467449188232, -0.4545017182826996, -0.4045567214488983, -0.35461175441741943, -0.30466675758361816, -0.2547217607498169, -0.20477676391601562, -0.15483178198337555, -0.10488680005073547, -0.054941803216934204, -0.004996806383132935, 0.04494816064834595, 0.09489315748214722, 0.1448381543159485, 0.19478315114974976, 0.24472813308238983, 0.2946731150150299, 0.3446181118488312, 0.39456310868263245, 0.44450807571411133, 0.4944530725479126, 0.5443980693817139, 0.5943430662155151, 0.6442880630493164, 0.6942330598831177, 0.744178056716919, 0.7941230535507202, 0.8440679907798767, 0.894012987613678, 0.9439579844474792, 0.9939029812812805, 1.043847918510437, 1.0937929153442383, 1.1437379121780396, 1.1936829090118408, 1.243627905845642, 1.2935729026794434, 1.3435178995132446, 1.393462896347046, 1.4434078931808472, 1.4933528900146484, 1.5432978868484497, 1.593242883682251, 1.6431877613067627, 1.6931328773498535, 1.7430777549743652, 1.7930227518081665, 1.8429677486419678, 1.892912745475769, 1.9428577423095703, 1.9928027391433716, 2.042747735977173, 2.0926926136016846, 2.1426377296447754]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 6.0, 9.0, 11.0, 16.0, 20.0, 15.0, 17.0, 29.0, 28.0, 40.0, 41.0, 44.0, 36.0, 43.0, 50.0, 50.0, 42.0, 59.0, 46.0, 44.0, 39.0, 42.0, 27.0, 35.0, 27.0, 32.0, 26.0, 21.0, 17.0, 14.0, 10.0, 14.0, 3.0, 9.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1705529689788818, -1.1307274103164673, -1.0909018516540527, -1.0510761737823486, -1.011250615119934, -0.9714250564575195, -0.931599497795105, -0.8917739391326904, -0.8519483208656311, -0.8121227622032166, -0.7722971439361572, -0.7324715852737427, -0.6926460266113281, -0.6528204083442688, -0.6129948496818542, -0.5731692314147949, -0.5333436727523804, -0.49351808428764343, -0.4536924958229065, -0.41386693716049194, -0.374041348695755, -0.33421576023101807, -0.2943902015686035, -0.2545646131038666, -0.21473902463912964, -0.1749134361743927, -0.13508786261081696, -0.09526228159666061, -0.05543670058250427, -0.015611112117767334, 0.02421446144580841, 0.06404003500938416, 0.1038656234741211, 0.14369121193885803, 0.18351678550243378, 0.22334235906600952, 0.26316794753074646, 0.3029935359954834, 0.34281909465789795, 0.3826446831226349, 0.4224702715873718, 0.46229586005210876, 0.5021214485168457, 0.5419470071792603, 0.5817725658416748, 0.6215981841087341, 0.6614237427711487, 0.701249361038208, 0.7410749197006226, 0.7809004783630371, 0.8207260966300964, 0.860551655292511, 0.9003772735595703, 0.9402028322219849, 0.9800283908843994, 1.019853949546814, 1.0596795082092285, 1.099505066871643, 1.1393306255340576, 1.1791563034057617, 1.2189818620681763, 1.2588074207305908, 1.2986329793930054, 1.33845853805542, 1.378284215927124]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 13.0, 16.0, 29.0, 30.0, 37.0, 83.0, 127.0, 211.0, 350.0, 662.0, 1368.0, 2851.0, 6833.0, 16991.0, 44322.0, 111464.0, 232892.0, 299522.0, 191745.0, 83593.0, 32938.0, 12733.0, 4993.0, 2269.0, 1124.0, 570.0, 322.0, 160.0, 107.0, 69.0, 37.0, 32.0, 22.0, 9.0, 6.0, 3.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4586334228515625, -1.398712158203125, -1.3387908935546875, -1.27886962890625, -1.2189483642578125, -1.159027099609375, -1.0991058349609375, -1.0391845703125, -0.9792633056640625, -0.919342041015625, -0.8594207763671875, -0.79949951171875, -0.7395782470703125, -0.679656982421875, -0.6197357177734375, -0.559814453125, -0.4998931884765625, -0.439971923828125, -0.3800506591796875, -0.32012939453125, -0.2602081298828125, -0.200286865234375, -0.1403656005859375, -0.0804443359375, -0.0205230712890625, 0.039398193359375, 0.0993194580078125, 0.15924072265625, 0.2191619873046875, 0.279083251953125, 0.3390045166015625, 0.39892578125, 0.4588470458984375, 0.518768310546875, 0.5786895751953125, 0.63861083984375, 0.6985321044921875, 0.758453369140625, 0.8183746337890625, 0.8782958984375, 0.9382171630859375, 0.998138427734375, 1.0580596923828125, 1.11798095703125, 1.1779022216796875, 1.237823486328125, 1.2977447509765625, 1.357666015625, 1.4175872802734375, 1.477508544921875, 1.5374298095703125, 1.59735107421875, 1.6572723388671875, 1.717193603515625, 1.7771148681640625, 1.8370361328125, 1.8969573974609375, 1.956878662109375, 2.0167999267578125, 2.07672119140625, 2.1366424560546875, 2.196563720703125, 2.2564849853515625, 2.31640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 4.0, 5.0, 13.0, 10.0, 6.0, 12.0, 14.0, 27.0, 18.0, 21.0, 25.0, 30.0, 33.0, 38.0, 47.0, 51.0, 40.0, 53.0, 46.0, 56.0, 48.0, 50.0, 42.0, 35.0, 39.0, 31.0, 34.0, 23.0, 28.0, 24.0, 21.0, 15.0, 11.0, 12.0, 12.0, 7.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.954132080078125, -1.88677978515625, -1.819427490234375, -1.7520751953125, -1.684722900390625, -1.61737060546875, -1.550018310546875, -1.482666015625, -1.415313720703125, -1.34796142578125, -1.280609130859375, -1.2132568359375, -1.145904541015625, -1.07855224609375, -1.011199951171875, -0.94384765625, -0.876495361328125, -0.80914306640625, -0.741790771484375, -0.6744384765625, -0.607086181640625, -0.53973388671875, -0.472381591796875, -0.405029296875, -0.337677001953125, -0.27032470703125, -0.202972412109375, -0.1356201171875, -0.068267822265625, -0.00091552734375, 0.066436767578125, 0.1337890625, 0.201141357421875, 0.26849365234375, 0.335845947265625, 0.4031982421875, 0.470550537109375, 0.53790283203125, 0.605255126953125, 0.672607421875, 0.739959716796875, 0.80731201171875, 0.874664306640625, 0.9420166015625, 1.009368896484375, 1.07672119140625, 1.144073486328125, 1.21142578125, 1.278778076171875, 1.34613037109375, 1.413482666015625, 1.4808349609375, 1.548187255859375, 1.61553955078125, 1.682891845703125, 1.750244140625, 1.817596435546875, 1.88494873046875, 1.952301025390625, 2.0196533203125, 2.087005615234375, 2.15435791015625, 2.221710205078125, 2.2890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 9.0, 9.0, 10.0, 12.0, 18.0, 29.0, 36.0, 51.0, 84.0, 118.0, 179.0, 310.0, 507.0, 1128.0, 2537.0, 6659.0, 20785.0, 72843.0, 236226.0, 401316.0, 212879.0, 63536.0, 18543.0, 6094.0, 2249.0, 1019.0, 505.0, 291.0, 190.0, 107.0, 91.0, 52.0, 35.0, 23.0, 20.0, 10.0, 12.0, 10.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.3203125, -3.229217529296875, -3.13812255859375, -3.047027587890625, -2.9559326171875, -2.864837646484375, -2.77374267578125, -2.682647705078125, -2.591552734375, -2.500457763671875, -2.40936279296875, -2.318267822265625, -2.2271728515625, -2.136077880859375, -2.04498291015625, -1.953887939453125, -1.86279296875, -1.771697998046875, -1.68060302734375, -1.589508056640625, -1.4984130859375, -1.407318115234375, -1.31622314453125, -1.225128173828125, -1.134033203125, -1.042938232421875, -0.95184326171875, -0.860748291015625, -0.7696533203125, -0.678558349609375, -0.58746337890625, -0.496368408203125, -0.4052734375, -0.314178466796875, -0.22308349609375, -0.131988525390625, -0.0408935546875, 0.050201416015625, 0.14129638671875, 0.232391357421875, 0.323486328125, 0.414581298828125, 0.50567626953125, 0.596771240234375, 0.6878662109375, 0.778961181640625, 0.87005615234375, 0.961151123046875, 1.05224609375, 1.143341064453125, 1.23443603515625, 1.325531005859375, 1.4166259765625, 1.507720947265625, 1.59881591796875, 1.689910888671875, 1.781005859375, 1.872100830078125, 1.96319580078125, 2.054290771484375, 2.1453857421875, 2.236480712890625, 2.32757568359375, 2.418670654296875, 2.509765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 4.0, 8.0, 12.0, 19.0, 17.0, 12.0, 20.0, 24.0, 32.0, 39.0, 30.0, 44.0, 46.0, 41.0, 50.0, 45.0, 61.0, 57.0, 51.0, 48.0, 46.0, 41.0, 37.0, 31.0, 34.0, 30.0, 24.0, 23.0, 11.0, 15.0, 13.0, 8.0, 6.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.501953125, -3.415771484375, -3.32958984375, -3.243408203125, -3.1572265625, -3.071044921875, -2.98486328125, -2.898681640625, -2.8125, -2.726318359375, -2.64013671875, -2.553955078125, -2.4677734375, -2.381591796875, -2.29541015625, -2.209228515625, -2.123046875, -2.036865234375, -1.95068359375, -1.864501953125, -1.7783203125, -1.692138671875, -1.60595703125, -1.519775390625, -1.43359375, -1.347412109375, -1.26123046875, -1.175048828125, -1.0888671875, -1.002685546875, -0.91650390625, -0.830322265625, -0.744140625, -0.657958984375, -0.57177734375, -0.485595703125, -0.3994140625, -0.313232421875, -0.22705078125, -0.140869140625, -0.0546875, 0.031494140625, 0.11767578125, 0.203857421875, 0.2900390625, 0.376220703125, 0.46240234375, 0.548583984375, 0.634765625, 0.720947265625, 0.80712890625, 0.893310546875, 0.9794921875, 1.065673828125, 1.15185546875, 1.238037109375, 1.32421875, 1.410400390625, 1.49658203125, 1.582763671875, 1.6689453125, 1.755126953125, 1.84130859375, 1.927490234375, 2.013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 24.0, 33.0, 40.0, 70.0, 96.0, 148.0, 296.0, 505.0, 1060.0, 2058.0, 4414.0, 9824.0, 23326.0, 57746.0, 134562.0, 254328.0, 308236.0, 144153.0, 62520.0, 25400.0, 10394.0, 4614.0, 2225.0, 1099.0, 573.0, 320.0, 195.0, 95.0, 70.0, 29.0, 24.0, 15.0, 15.0, 5.0, 8.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.43988037109375, -0.4241943359375, -0.40850830078125, -0.392822265625, -0.37713623046875, -0.3614501953125, -0.34576416015625, -0.330078125, -0.31439208984375, -0.2987060546875, -0.28302001953125, -0.267333984375, -0.25164794921875, -0.2359619140625, -0.22027587890625, -0.20458984375, -0.18890380859375, -0.1732177734375, -0.15753173828125, -0.141845703125, -0.12615966796875, -0.1104736328125, -0.09478759765625, -0.0791015625, -0.06341552734375, -0.0477294921875, -0.03204345703125, -0.016357421875, -0.00067138671875, 0.0150146484375, 0.03070068359375, 0.04638671875, 0.06207275390625, 0.0777587890625, 0.09344482421875, 0.109130859375, 0.12481689453125, 0.1405029296875, 0.15618896484375, 0.171875, 0.18756103515625, 0.2032470703125, 0.21893310546875, 0.234619140625, 0.25030517578125, 0.2659912109375, 0.28167724609375, 0.29736328125, 0.31304931640625, 0.3287353515625, 0.34442138671875, 0.360107421875, 0.37579345703125, 0.3914794921875, 0.40716552734375, 0.4228515625, 0.43853759765625, 0.4542236328125, 0.46990966796875, 0.485595703125, 0.50128173828125, 0.5169677734375, 0.53265380859375, 0.54833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 7.0, 15.0, 15.0, 21.0, 28.0, 38.0, 45.0, 68.0, 73.0, 86.0, 165.0, 88.0, 70.0, 59.0, 47.0, 46.0, 24.0, 24.0, 14.0, 22.0, 4.0, 6.0, 4.0, 5.0, 3.0, 7.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001251697540283203, -0.00012028589844703674, -0.00011540204286575317, -0.0001105181872844696, -0.00010563433170318604, -0.00010075047612190247, -9.58666205406189e-05, -9.098276495933533e-05, -8.609890937805176e-05, -8.121505379676819e-05, -7.633119821548462e-05, -7.144734263420105e-05, -6.656348705291748e-05, -6.167963147163391e-05, -5.679577589035034e-05, -5.191192030906677e-05, -4.70280647277832e-05, -4.2144209146499634e-05, -3.7260353565216064e-05, -3.2376497983932495e-05, -2.7492642402648926e-05, -2.2608786821365356e-05, -1.7724931240081787e-05, -1.2841075658798218e-05, -7.957220077514648e-06, -3.073364496231079e-06, 1.8104910850524902e-06, 6.6943466663360596e-06, 1.1578202247619629e-05, 1.6462057828903198e-05, 2.1345913410186768e-05, 2.6229768991470337e-05, 3.1113624572753906e-05, 3.5997480154037476e-05, 4.0881335735321045e-05, 4.5765191316604614e-05, 5.0649046897888184e-05, 5.553290247917175e-05, 6.041675806045532e-05, 6.530061364173889e-05, 7.018446922302246e-05, 7.506832480430603e-05, 7.99521803855896e-05, 8.483603596687317e-05, 8.971989154815674e-05, 9.460374712944031e-05, 9.948760271072388e-05, 0.00010437145829200745, 0.00010925531387329102, 0.00011413916945457458, 0.00011902302503585815, 0.00012390688061714172, 0.0001287907361984253, 0.00013367459177970886, 0.00013855844736099243, 0.000143442302942276, 0.00014832615852355957, 0.00015321001410484314, 0.0001580938696861267, 0.00016297772526741028, 0.00016786158084869385, 0.00017274543642997742, 0.00017762929201126099, 0.00018251314759254456, 0.00018739700317382812]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 14.0, 23.0, 21.0, 32.0, 50.0, 74.0, 96.0, 142.0, 170.0, 298.0, 379.0, 621.0, 944.0, 1706.0, 2872.0, 5673.0, 11516.0, 27643.0, 77680.0, 215071.0, 400278.0, 189710.0, 66895.0, 24356.0, 10221.0, 5088.0, 2717.0, 1488.0, 962.0, 582.0, 380.0, 279.0, 182.0, 106.0, 79.0, 53.0, 41.0, 26.0, 22.0, 17.0, 12.0, 9.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6561203002929688, -0.6330413818359375, -0.6099624633789062, -0.586883544921875, -0.5638046264648438, -0.5407257080078125, -0.5176467895507812, -0.49456787109375, -0.47148895263671875, -0.4484100341796875, -0.42533111572265625, -0.402252197265625, -0.37917327880859375, -0.3560943603515625, -0.33301544189453125, -0.3099365234375, -0.28685760498046875, -0.2637786865234375, -0.24069976806640625, -0.217620849609375, -0.19454193115234375, -0.1714630126953125, -0.14838409423828125, -0.12530517578125, -0.10222625732421875, -0.0791473388671875, -0.05606842041015625, -0.032989501953125, -0.00991058349609375, 0.0131683349609375, 0.03624725341796875, 0.059326171875, 0.08240509033203125, 0.1054840087890625, 0.12856292724609375, 0.151641845703125, 0.17472076416015625, 0.1977996826171875, 0.22087860107421875, 0.24395751953125, 0.26703643798828125, 0.2901153564453125, 0.31319427490234375, 0.336273193359375, 0.35935211181640625, 0.3824310302734375, 0.40550994873046875, 0.4285888671875, 0.45166778564453125, 0.4747467041015625, 0.49782562255859375, 0.520904541015625, 0.5439834594726562, 0.5670623779296875, 0.5901412963867188, 0.61322021484375, 0.6362991333007812, 0.6593780517578125, 0.6824569702148438, 0.705535888671875, 0.7286148071289062, 0.7516937255859375, 0.7747726440429688, 0.7978515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 1.0, 7.0, 9.0, 14.0, 10.0, 10.0, 23.0, 23.0, 24.0, 40.0, 37.0, 72.0, 67.0, 74.0, 149.0, 74.0, 78.0, 56.0, 46.0, 40.0, 36.0, 28.0, 13.0, 10.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43701171875, -0.4227409362792969, -0.40847015380859375, -0.3941993713378906, -0.3799285888671875, -0.3656578063964844, -0.35138702392578125, -0.3371162414550781, -0.322845458984375, -0.3085746765136719, -0.29430389404296875, -0.2800331115722656, -0.2657623291015625, -0.2514915466308594, -0.23722076416015625, -0.22294998168945312, -0.20867919921875, -0.19440841674804688, -0.18013763427734375, -0.16586685180664062, -0.1515960693359375, -0.13732528686523438, -0.12305450439453125, -0.10878372192382812, -0.094512939453125, -0.08024215698242188, -0.06597137451171875, -0.051700592041015625, -0.0374298095703125, -0.023159027099609375, -0.00888824462890625, 0.005382537841796875, 0.0196533203125, 0.033924102783203125, 0.04819488525390625, 0.062465667724609375, 0.0767364501953125, 0.09100723266601562, 0.10527801513671875, 0.11954879760742188, 0.133819580078125, 0.14809036254882812, 0.16236114501953125, 0.17663192749023438, 0.1909027099609375, 0.20517349243164062, 0.21944427490234375, 0.23371505737304688, 0.24798583984375, 0.2622566223144531, 0.27652740478515625, 0.2907981872558594, 0.3050689697265625, 0.3193397521972656, 0.33361053466796875, 0.3478813171386719, 0.362152099609375, 0.3764228820800781, 0.39069366455078125, 0.4049644470214844, 0.4192352294921875, 0.4335060119628906, 0.44777679443359375, 0.4620475769042969, 0.476318359375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 10.0, 32.0, 48.0, 74.0, 97.0, 128.0, 132.0, 129.0, 111.0, 83.0, 64.0, 48.0, 15.0, 13.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0425164699554443, -2.838343620300293, -2.6341707706451416, -2.4299979209899902, -2.225825309753418, -2.0216522216796875, -1.8174796104431152, -1.6133067607879639, -1.4091339111328125, -1.2049610614776611, -1.0007882118225098, -0.796615481376648, -0.5924426317214966, -0.3882697820663452, -0.1840970516204834, 0.02007579803466797, 0.22424864768981934, 0.4284214675426483, 0.6325942873954773, 0.8367670774459839, 1.0409399271011353, 1.2451127767562866, 1.4492855072021484, 1.6534583568572998, 1.8576312065124512, 2.0618040561676025, 2.265976905822754, 2.470149517059326, 2.6743226051330566, 2.878495216369629, 3.0826680660247803, 3.2868409156799316, 3.491013526916504, 3.6951863765716553, 3.8993592262268066, 4.103531837463379, 4.307704925537109, 4.511877536773682, 4.716050148010254, 4.920223236083984, 5.124396324157715, 5.328568935394287, 5.532742023468018, 5.73691463470459, 5.94108772277832, 6.145260334014893, 6.349432945251465, 6.553606033325195, 6.757778644561768, 6.96195125579834, 7.16612434387207, 7.370296955108643, 7.574470043182373, 7.778642654418945, 7.982815742492676, 8.186988830566406, 8.39116096496582, 8.59533405303955, 8.799506187438965, 9.003679275512695, 9.207852363586426, 9.412025451660156, 9.61619758605957, 9.8203706741333, 10.024543762207031]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 9.0, 9.0, 12.0, 14.0, 9.0, 22.0, 16.0, 27.0, 28.0, 27.0, 36.0, 30.0, 41.0, 38.0, 39.0, 47.0, 64.0, 45.0, 59.0, 46.0, 51.0, 43.0, 32.0, 44.0, 28.0, 31.0, 14.0, 26.0, 13.0, 16.0, 12.0, 12.0, 9.0, 11.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.560827255249023, -4.430590629577637, -4.30035400390625, -4.170117378234863, -4.039880752563477, -3.90964412689209, -3.779407501220703, -3.6491708755493164, -3.5189342498779297, -3.388697624206543, -3.2584609985351562, -3.1282243728637695, -2.997987747192383, -2.867751121520996, -2.7375144958496094, -2.6072778701782227, -2.477041006088257, -2.34680438041687, -2.2165677547454834, -2.0863311290740967, -1.95609450340271, -1.8258578777313232, -1.695621132850647, -1.5653845071792603, -1.4351478815078735, -1.3049112558364868, -1.1746746301651, -1.0444378852844238, -0.9142013192176819, -0.7839646935462952, -0.6537280082702637, -0.523491382598877, -0.39325475692749023, -0.2630181312561035, -0.1327814757823944, -0.0025448203086853027, 0.12769180536270142, 0.25792843103408813, 0.38816511631011963, 0.5184017419815063, 0.6486383676528931, 0.7788749933242798, 0.9091116189956665, 1.0393483638763428, 1.1695849895477295, 1.2998216152191162, 1.430058240890503, 1.5602948665618896, 1.6905314922332764, 1.820768117904663, 1.9510047435760498, 2.0812413692474365, 2.2114779949188232, 2.34171462059021, 2.471951484680176, 2.6021881103515625, 2.732424736022949, 2.862661361694336, 2.9928979873657227, 3.1231346130371094, 3.253371238708496, 3.383607864379883, 3.5138444900512695, 3.6440811157226562, 3.774317741394043]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 9.0, 6.0, 9.0, 15.0, 21.0, 19.0, 36.0, 51.0, 70.0, 120.0, 200.0, 292.0, 455.0, 761.0, 1238.0, 2073.0, 3264.0, 5536.0, 9887.0, 1002119.0, 9941.0, 5648.0, 3506.0, 2052.0, 1191.0, 736.0, 459.0, 287.0, 192.0, 113.0, 84.0, 52.0, 34.0, 25.0, 20.0, 13.0, 15.0, 10.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7727837562561035, -3.6491355895996094, -3.5254874229431152, -3.401839256286621, -3.278191328048706, -3.154543161392212, -3.0308949947357178, -2.9072468280792236, -2.7835988998413086, -2.6599507331848145, -2.5363025665283203, -2.412654399871826, -2.289006471633911, -2.165358304977417, -2.041710138320923, -1.9180619716644287, -1.7944138050079346, -1.6707656383514404, -1.5471175909042358, -1.4234694242477417, -1.299821376800537, -1.176173210144043, -1.0525250434875488, -0.9288769364356995, -0.8052288293838501, -0.6815807223320007, -0.5579326152801514, -0.4342844486236572, -0.31063634157180786, -0.1869882345199585, -0.06334006786346436, 0.06030803918838501, 0.18395614624023438, 0.30760425329208374, 0.4312523901462555, 0.5549005270004272, 0.6785486340522766, 0.802196741104126, 0.9258449077606201, 1.0494930744171143, 1.1731411218643188, 1.296789288520813, 1.4204373359680176, 1.5440855026245117, 1.6677336692810059, 1.7913817167282104, 1.9150298833847046, 2.038677930831909, 2.1623260974884033, 2.2859742641448975, 2.4096224308013916, 2.5332703590393066, 2.656918525695801, 2.780566692352295, 2.904214859008789, 3.027863025665283, 3.1515111923217773, 3.2751593589782715, 3.3988075256347656, 3.5224556922912598, 3.646103620529175, 3.769751787185669, 3.893399953842163, 4.017047882080078, 4.140696048736572]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 15.0, 37.0, 68.0, 170.0, 577.0, 1603.0, 10461.0, 249047.0, 51187748.0, 17422.0, 2241.0, 579.0, 246.0, 98.0, 49.0, 34.0, 11.0, 12.0, 3.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -17.95361328125, -17.3134765625, -16.67333984375, -16.033203125, -15.39306640625, -14.7529296875, -14.11279296875, -13.47265625, -12.83251953125, -12.1923828125, -11.55224609375, -10.912109375, -10.27197265625, -9.6318359375, -8.99169921875, -8.3515625, -7.71142578125, -7.0712890625, -6.43115234375, -5.791015625, -5.15087890625, -4.5107421875, -3.87060546875, -3.23046875, -2.59033203125, -1.9501953125, -1.31005859375, -0.669921875, -0.02978515625, 0.6103515625, 1.25048828125, 1.890625, 2.53076171875, 3.1708984375, 3.81103515625, 4.451171875, 5.09130859375, 5.7314453125, 6.37158203125, 7.01171875, 7.65185546875, 8.2919921875, 8.93212890625, 9.572265625, 10.21240234375, 10.8525390625, 11.49267578125, 12.1328125, 12.77294921875, 13.4130859375, 14.05322265625, 14.693359375, 15.33349609375, 15.9736328125, 16.61376953125, 17.25390625, 17.89404296875, 18.5341796875, 19.17431640625, 19.814453125, 20.45458984375, 21.0947265625, 21.73486328125, 22.375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 1.0, 1.0, 11.0, 12.0, 11.0, 31.0, 49.0, 48.0, 91.0, 144.0, 203.0, 348.0, 471.0, 783.0, 1379.0, 2330.0, 3880.0, 6875.0, 12414.0, 22343.0, 40708.0, 76113.0, 138702.0, 239028.0, 375659.0, 528286.0, 3649618.0, 451694.0, 313432.0, 189470.0, 107555.0, 58313.0, 31436.0, 17177.0, 9502.0, 5392.0, 3223.0, 1801.0, 1110.0, 652.0, 393.0, 252.0, 160.0, 107.0, 61.0, 64.0, 41.0, 18.0, 17.0, 9.0, 3.0, 9.0, 2.0, 2.0], "bins": [-1.3916015625, -1.353240966796875, -1.31488037109375, -1.276519775390625, -1.2381591796875, -1.199798583984375, -1.16143798828125, -1.123077392578125, -1.084716796875, -1.046356201171875, -1.00799560546875, -0.969635009765625, -0.9312744140625, -0.892913818359375, -0.85455322265625, -0.816192626953125, -0.77783203125, -0.739471435546875, -0.70111083984375, -0.662750244140625, -0.6243896484375, -0.586029052734375, -0.54766845703125, -0.509307861328125, -0.470947265625, -0.432586669921875, -0.39422607421875, -0.355865478515625, -0.3175048828125, -0.279144287109375, -0.24078369140625, -0.202423095703125, -0.1640625, -0.125701904296875, -0.08734130859375, -0.048980712890625, -0.0106201171875, 0.027740478515625, 0.06610107421875, 0.104461669921875, 0.142822265625, 0.181182861328125, 0.21954345703125, 0.257904052734375, 0.2962646484375, 0.334625244140625, 0.37298583984375, 0.411346435546875, 0.44970703125, 0.488067626953125, 0.52642822265625, 0.564788818359375, 0.6031494140625, 0.641510009765625, 0.67987060546875, 0.718231201171875, 0.756591796875, 0.794952392578125, 0.83331298828125, 0.871673583984375, 0.9100341796875, 0.948394775390625, 0.98675537109375, 1.025115966796875, 1.0634765625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 3.0, 9.0, 8.0, 10.0, 15.0, 13.0, 27.0, 17.0, 27.0, 36.0, 33.0, 44.0, 41.0, 45.0, 57.0, 62.0, 1069.0, 57.0, 51.0, 53.0, 43.0, 44.0, 47.0, 39.0, 33.0, 20.0, 24.0, 21.0, 16.0, 15.0, 6.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-25.90625, -25.231689453125, -24.55712890625, -23.882568359375, -23.2080078125, -22.533447265625, -21.85888671875, -21.184326171875, -20.509765625, -19.835205078125, -19.16064453125, -18.486083984375, -17.8115234375, -17.136962890625, -16.46240234375, -15.787841796875, -15.11328125, -14.438720703125, -13.76416015625, -13.089599609375, -12.4150390625, -11.740478515625, -11.06591796875, -10.391357421875, -9.716796875, -9.042236328125, -8.36767578125, -7.693115234375, -7.0185546875, -6.343994140625, -5.66943359375, -4.994873046875, -4.3203125, -3.645751953125, -2.97119140625, -2.296630859375, -1.6220703125, -0.947509765625, -0.27294921875, 0.401611328125, 1.076171875, 1.750732421875, 2.42529296875, 3.099853515625, 3.7744140625, 4.448974609375, 5.12353515625, 5.798095703125, 6.47265625, 7.147216796875, 7.82177734375, 8.496337890625, 9.1708984375, 9.845458984375, 10.52001953125, 11.194580078125, 11.869140625, 12.543701171875, 13.21826171875, 13.892822265625, 14.5673828125, 15.241943359375, 15.91650390625, 16.591064453125, 17.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 1.0, 7.0, 7.0, 10.0, 9.0, 19.0, 23.0, 50.0, 56.0, 104.0, 135.0, 220.0, 321.0, 489.0, 787.0, 1196.0, 1879.0, 2983.0, 4851.0, 8047.0, 13192.0, 21361.0, 35923.0, 58676.0, 95352.0, 150522.0, 223100.0, 309431.0, 386544.0, 3535032.0, 425368.0, 329570.0, 243953.0, 165967.0, 106690.0, 66348.0, 40233.0, 24408.0, 14533.0, 9013.0, 5527.0, 3371.0, 2131.0, 1340.0, 936.0, 589.0, 395.0, 242.0, 158.0, 101.0, 79.0, 61.0, 42.0, 18.0, 14.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.87548828125, -0.846893310546875, -0.81829833984375, -0.789703369140625, -0.7611083984375, -0.732513427734375, -0.70391845703125, -0.675323486328125, -0.646728515625, -0.618133544921875, -0.58953857421875, -0.560943603515625, -0.5323486328125, -0.503753662109375, -0.47515869140625, -0.446563720703125, -0.41796875, -0.389373779296875, -0.36077880859375, -0.332183837890625, -0.3035888671875, -0.274993896484375, -0.24639892578125, -0.217803955078125, -0.189208984375, -0.160614013671875, -0.13201904296875, -0.103424072265625, -0.0748291015625, -0.046234130859375, -0.01763916015625, 0.010955810546875, 0.03955078125, 0.068145751953125, 0.09674072265625, 0.125335693359375, 0.1539306640625, 0.182525634765625, 0.21112060546875, 0.239715576171875, 0.268310546875, 0.296905517578125, 0.32550048828125, 0.354095458984375, 0.3826904296875, 0.411285400390625, 0.43988037109375, 0.468475341796875, 0.4970703125, 0.525665283203125, 0.55426025390625, 0.582855224609375, 0.6114501953125, 0.640045166015625, 0.66864013671875, 0.697235107421875, 0.725830078125, 0.754425048828125, 0.78302001953125, 0.811614990234375, 0.8402099609375, 0.868804931640625, 0.89739990234375, 0.925994873046875, 0.95458984375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 10.0, 6.0, 13.0, 16.0, 18.0, 25.0, 18.0, 20.0, 34.0, 42.0, 38.0, 36.0, 43.0, 41.0, 39.0, 51.0, 1036.0, 73.0, 45.0, 53.0, 44.0, 37.0, 47.0, 43.0, 37.0, 21.0, 24.0, 26.0, 13.0, 18.0, 12.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.875, -17.327392578125, -16.77978515625, -16.232177734375, -15.6845703125, -15.136962890625, -14.58935546875, -14.041748046875, -13.494140625, -12.946533203125, -12.39892578125, -11.851318359375, -11.3037109375, -10.756103515625, -10.20849609375, -9.660888671875, -9.11328125, -8.565673828125, -8.01806640625, -7.470458984375, -6.9228515625, -6.375244140625, -5.82763671875, -5.280029296875, -4.732421875, -4.184814453125, -3.63720703125, -3.089599609375, -2.5419921875, -1.994384765625, -1.44677734375, -0.899169921875, -0.3515625, 0.196044921875, 0.74365234375, 1.291259765625, 1.8388671875, 2.386474609375, 2.93408203125, 3.481689453125, 4.029296875, 4.576904296875, 5.12451171875, 5.672119140625, 6.2197265625, 6.767333984375, 7.31494140625, 7.862548828125, 8.41015625, 8.957763671875, 9.50537109375, 10.052978515625, 10.6005859375, 11.148193359375, 11.69580078125, 12.243408203125, 12.791015625, 13.338623046875, 13.88623046875, 14.433837890625, 14.9814453125, 15.529052734375, 16.07666015625, 16.624267578125, 17.171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 12.0, 17.0, 17.0, 23.0, 35.0, 41.0, 49.0, 64.0, 101.0, 151.0, 254.0, 418.0, 686.0, 1228.0, 2089.0, 3947.0, 7584.0, 14279.0, 28177.0, 55850.0, 113091.0, 5641262.0, 239639.0, 89440.0, 44455.0, 22851.0, 11958.0, 6082.0, 3157.0, 1795.0, 1066.0, 559.0, 337.0, 220.0, 160.0, 118.0, 62.0, 39.0, 28.0, 24.0, 15.0, 14.0, 8.0, 7.0, 6.0, 4.0, 9.0, 5.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0], "bins": [-3.294921875, -3.191436767578125, -3.08795166015625, -2.984466552734375, -2.8809814453125, -2.777496337890625, -2.67401123046875, -2.570526123046875, -2.467041015625, -2.363555908203125, -2.26007080078125, -2.156585693359375, -2.0531005859375, -1.949615478515625, -1.84613037109375, -1.742645263671875, -1.63916015625, -1.535675048828125, -1.43218994140625, -1.328704833984375, -1.2252197265625, -1.121734619140625, -1.01824951171875, -0.914764404296875, -0.811279296875, -0.707794189453125, -0.60430908203125, -0.500823974609375, -0.3973388671875, -0.293853759765625, -0.19036865234375, -0.086883544921875, 0.0166015625, 0.120086669921875, 0.22357177734375, 0.327056884765625, 0.4305419921875, 0.534027099609375, 0.63751220703125, 0.740997314453125, 0.844482421875, 0.947967529296875, 1.05145263671875, 1.154937744140625, 1.2584228515625, 1.361907958984375, 1.46539306640625, 1.568878173828125, 1.67236328125, 1.775848388671875, 1.87933349609375, 1.982818603515625, 2.0863037109375, 2.189788818359375, 2.29327392578125, 2.396759033203125, 2.500244140625, 2.603729248046875, 2.70721435546875, 2.810699462890625, 2.9141845703125, 3.017669677734375, 3.12115478515625, 3.224639892578125, 3.328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 8.0, 15.0, 11.0, 17.0, 26.0, 24.0, 28.0, 32.0, 36.0, 43.0, 44.0, 39.0, 43.0, 38.0, 83.0, 1037.0, 46.0, 47.0, 41.0, 40.0, 37.0, 33.0, 41.0, 34.0, 26.0, 23.0, 21.0, 19.0, 18.0, 8.0, 10.0, 5.0, 12.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.28125, -15.79248046875, -15.3037109375, -14.81494140625, -14.326171875, -13.83740234375, -13.3486328125, -12.85986328125, -12.37109375, -11.88232421875, -11.3935546875, -10.90478515625, -10.416015625, -9.92724609375, -9.4384765625, -8.94970703125, -8.4609375, -7.97216796875, -7.4833984375, -6.99462890625, -6.505859375, -6.01708984375, -5.5283203125, -5.03955078125, -4.55078125, -4.06201171875, -3.5732421875, -3.08447265625, -2.595703125, -2.10693359375, -1.6181640625, -1.12939453125, -0.640625, -0.15185546875, 0.3369140625, 0.82568359375, 1.314453125, 1.80322265625, 2.2919921875, 2.78076171875, 3.26953125, 3.75830078125, 4.2470703125, 4.73583984375, 5.224609375, 5.71337890625, 6.2021484375, 6.69091796875, 7.1796875, 7.66845703125, 8.1572265625, 8.64599609375, 9.134765625, 9.62353515625, 10.1123046875, 10.60107421875, 11.08984375, 11.57861328125, 12.0673828125, 12.55615234375, 13.044921875, 13.53369140625, 14.0224609375, 14.51123046875, 15.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 19.0, 60.0, 346.0, 436.0, 106.0, 27.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.49773406982422, -61.635929107666016, -59.77412033081055, -57.912315368652344, -56.050506591796875, -54.18870162963867, -52.32689666748047, -50.465087890625, -48.6032829284668, -46.741477966308594, -44.879669189453125, -43.01786422729492, -41.15605926513672, -39.29425048828125, -37.43244552612305, -35.570640563964844, -33.708831787109375, -31.84702491760254, -29.985218048095703, -28.1234130859375, -26.261606216430664, -24.399799346923828, -22.537994384765625, -20.67618751525879, -18.814380645751953, -16.952573776245117, -15.090767860412598, -13.228961944580078, -11.367155075073242, -9.505348205566406, -7.643542289733887, -5.781736373901367, -3.9199295043945312, -2.0581231117248535, -0.19631671905517578, 1.665489673614502, 3.5272960662841797, 5.389102935791016, 7.250908851623535, 9.112714767456055, 10.97452163696289, 12.836328506469727, 14.698134422302246, 16.559940338134766, 18.4217472076416, 20.283554077148438, 22.14535903930664, 24.007165908813477, 25.868972778320312, 27.73077964782715, 29.592586517333984, 31.454391479492188, 33.316200256347656, 35.17800521850586, 37.03981018066406, 38.90161895751953, 40.763423919677734, 42.62522888183594, 44.487037658691406, 46.34884262084961, 48.21064758300781, 50.07245635986328, 51.934261322021484, 53.79606628417969, 55.657875061035156]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 8.0, 7.0, 14.0, 26.0, 18.0, 30.0, 41.0, 47.0, 54.0, 66.0, 71.0, 78.0, 84.0, 69.0, 72.0, 60.0, 36.0, 39.0, 31.0, 22.0, 20.0, 18.0, 11.0, 8.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.118831634521484, -42.92047119140625, -41.72210693359375, -40.52374267578125, -39.325382232666016, -38.12702178955078, -36.92865753173828, -35.73029327392578, -34.53193283081055, -33.33357238769531, -32.13520812988281, -30.936845779418945, -29.738483428955078, -28.54012107849121, -27.341758728027344, -26.143396377563477, -24.94503402709961, -23.746671676635742, -22.548309326171875, -21.349946975708008, -20.15158462524414, -18.953222274780273, -17.754859924316406, -16.55649757385254, -15.358135223388672, -14.159772872924805, -12.961410522460938, -11.76304817199707, -10.564685821533203, -9.366323471069336, -8.167961120605469, -6.969598770141602, -5.771232604980469, -4.572870254516602, -3.3745079040527344, -2.176145553588867, -0.977783203125, 0.2205791473388672, 1.4189414978027344, 2.6173038482666016, 3.8156661987304688, 5.014028549194336, 6.212390899658203, 7.41075325012207, 8.609115600585938, 9.807477951049805, 11.005840301513672, 12.204202651977539, 13.402565002441406, 14.600927352905273, 15.79928970336914, 16.997652053833008, 18.196014404296875, 19.394376754760742, 20.59273910522461, 21.791101455688477, 22.989463806152344, 24.18782615661621, 25.386188507080078, 26.584550857543945, 27.782913208007812, 28.98127555847168, 30.179637908935547, 31.378000259399414, 32.57636260986328]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 10.0, 18.0, 18.0, 27.0, 41.0, 53.0, 50.0, 97.0, 140.0, 231.0, 378.0, 596.0, 1106.0, 1920.0, 4064.0, 10624.0, 39314.0, 3876150.0, 216255.0, 27384.0, 8435.0, 3497.0, 1648.0, 843.0, 494.0, 277.0, 187.0, 128.0, 87.0, 69.0, 30.0, 25.0, 13.0, 17.0, 15.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2767353057861328, -0.2685585021972656, -0.26038169860839844, -0.25220489501953125, -0.24402809143066406, -0.23585128784179688, -0.2276744842529297, -0.2194976806640625, -0.2113208770751953, -0.20314407348632812, -0.19496726989746094, -0.18679046630859375, -0.17861366271972656, -0.17043685913085938, -0.1622600555419922, -0.154083251953125, -0.1459064483642578, -0.13772964477539062, -0.12955284118652344, -0.12137603759765625, -0.11319923400878906, -0.10502243041992188, -0.09684562683105469, -0.0886688232421875, -0.08049201965332031, -0.07231521606445312, -0.06413841247558594, -0.05596160888671875, -0.04778480529785156, -0.039608001708984375, -0.03143119812011719, -0.02325439453125, -0.015077590942382812, -0.006900787353515625, 0.0012760162353515625, 0.00945281982421875, 0.017629623413085938, 0.025806427001953125, 0.03398323059082031, 0.0421600341796875, 0.05033683776855469, 0.058513641357421875, 0.06669044494628906, 0.07486724853515625, 0.08304405212402344, 0.09122085571289062, 0.09939765930175781, 0.107574462890625, 0.11575126647949219, 0.12392807006835938, 0.13210487365722656, 0.14028167724609375, 0.14845848083496094, 0.15663528442382812, 0.1648120880126953, 0.1729888916015625, 0.1811656951904297, 0.18934249877929688, 0.19751930236816406, 0.20569610595703125, 0.21387290954589844, 0.22204971313476562, 0.2302265167236328, 0.2384033203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 10.0, 14.0, 9.0, 13.0, 145.0, 633.0, 13.0, 16.0, 15.0, 6.0, 3.0, 9.0, 6.0, 8.0, 8.0, 4.0, 5.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.126708984375, -0.12277412414550781, -0.11883926391601562, -0.11490440368652344, -0.11096954345703125, -0.10703468322753906, -0.10309982299804688, -0.09916496276855469, -0.0952301025390625, -0.09129524230957031, -0.08736038208007812, -0.08342552185058594, -0.07949066162109375, -0.07555580139160156, -0.07162094116210938, -0.06768608093261719, -0.063751220703125, -0.05981636047363281, -0.055881500244140625, -0.05194664001464844, -0.04801177978515625, -0.04407691955566406, -0.040142059326171875, -0.03620719909667969, -0.0322723388671875, -0.028337478637695312, -0.024402618408203125, -0.020467758178710938, -0.01653289794921875, -0.012598037719726562, -0.008663177490234375, -0.0047283172607421875, -0.00079345703125, 0.0031414031982421875, 0.007076263427734375, 0.011011123657226562, 0.01494598388671875, 0.018880844116210938, 0.022815704345703125, 0.026750564575195312, 0.0306854248046875, 0.03462028503417969, 0.038555145263671875, 0.04249000549316406, 0.04642486572265625, 0.05035972595214844, 0.054294586181640625, 0.05822944641113281, 0.062164306640625, 0.06609916687011719, 0.07003402709960938, 0.07396888732910156, 0.07790374755859375, 0.08183860778808594, 0.08577346801757812, 0.08970832824707031, 0.0936431884765625, 0.09757804870605469, 0.10151290893554688, 0.10544776916503906, 0.10938262939453125, 0.11331748962402344, 0.11725234985351562, 0.12118721008300781, 0.1251220703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 11.0, 11.0, 8.0, 15.0, 31.0, 47.0, 76.0, 104.0, 190.0, 242.0, 519.0, 898.0, 1891.0, 4489.0, 12288.0, 51202.0, 528236.0, 3384147.0, 172474.0, 25364.0, 7039.0, 2568.0, 1187.0, 555.0, 277.0, 140.0, 81.0, 66.0, 38.0, 34.0, 17.0, 13.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.19329452514648438, -0.18749237060546875, -0.18169021606445312, -0.1758880615234375, -0.17008590698242188, -0.16428375244140625, -0.15848159790039062, -0.152679443359375, -0.14687728881835938, -0.14107513427734375, -0.13527297973632812, -0.1294708251953125, -0.12366867065429688, -0.11786651611328125, -0.11206436157226562, -0.10626220703125, -0.10046005249023438, -0.09465789794921875, -0.08885574340820312, -0.0830535888671875, -0.07725143432617188, -0.07144927978515625, -0.06564712524414062, -0.059844970703125, -0.054042816162109375, -0.04824066162109375, -0.042438507080078125, -0.0366363525390625, -0.030834197998046875, -0.02503204345703125, -0.019229888916015625, -0.013427734375, -0.007625579833984375, -0.00182342529296875, 0.003978729248046875, 0.0097808837890625, 0.015583038330078125, 0.02138519287109375, 0.027187347412109375, 0.032989501953125, 0.038791656494140625, 0.04459381103515625, 0.050395965576171875, 0.0561981201171875, 0.062000274658203125, 0.06780242919921875, 0.07360458374023438, 0.07940673828125, 0.08520889282226562, 0.09101104736328125, 0.09681320190429688, 0.1026153564453125, 0.10841751098632812, 0.11421966552734375, 0.12002182006835938, 0.125823974609375, 0.13162612915039062, 0.13742828369140625, 0.14323043823242188, 0.1490325927734375, 0.15483474731445312, 0.16063690185546875, 0.16643905639648438, 0.1722412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 18.0, 21.0, 24.0, 43.0, 56.0, 111.0, 218.0, 511.0, 1617.0, 822.0, 295.0, 125.0, 68.0, 45.0, 22.0, 10.0, 12.0, 12.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1673583984375, -0.16324996948242188, -0.15914154052734375, -0.15503311157226562, -0.1509246826171875, -0.14681625366210938, -0.14270782470703125, -0.13859939575195312, -0.134490966796875, -0.13038253784179688, -0.12627410888671875, -0.12216567993164062, -0.1180572509765625, -0.11394882202148438, -0.10984039306640625, -0.10573196411132812, -0.10162353515625, -0.09751510620117188, -0.09340667724609375, -0.08929824829101562, -0.0851898193359375, -0.08108139038085938, -0.07697296142578125, -0.07286453247070312, -0.068756103515625, -0.06464767456054688, -0.06053924560546875, -0.056430816650390625, -0.0523223876953125, -0.048213958740234375, -0.04410552978515625, -0.039997100830078125, -0.035888671875, -0.031780242919921875, -0.02767181396484375, -0.023563385009765625, -0.0194549560546875, -0.015346527099609375, -0.01123809814453125, -0.007129669189453125, -0.003021240234375, 0.001087188720703125, 0.00519561767578125, 0.009304046630859375, 0.0134124755859375, 0.017520904541015625, 0.02162933349609375, 0.025737762451171875, 0.02984619140625, 0.033954620361328125, 0.03806304931640625, 0.042171478271484375, 0.0462799072265625, 0.050388336181640625, 0.05449676513671875, 0.058605194091796875, 0.062713623046875, 0.06682205200195312, 0.07093048095703125, 0.07503890991210938, 0.0791473388671875, 0.08325576782226562, 0.08736419677734375, 0.09147262573242188, 0.0955810546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 24.0, 341.0, 604.0, 26.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9000369310379028, -0.8366281986236572, -0.7732194662094116, -0.7098106741905212, -0.6464019417762756, -0.58299320936203, -0.5195844173431396, -0.45617568492889404, -0.39276695251464844, -0.32935822010040283, -0.26594945788383484, -0.20254071056842804, -0.13913196325302124, -0.07572323083877563, -0.012314468622207642, 0.05109429359436035, 0.11450302600860596, 0.17791177332401276, 0.24132052063941956, 0.30472928285598755, 0.36813801527023315, 0.43154674768447876, 0.49495550990104675, 0.5583642721176147, 0.6217730045318604, 0.685181736946106, 0.7485904693603516, 0.8119992613792419, 0.8754079937934875, 0.9388167262077332, 1.0022255182266235, 1.0656342506408691, 1.1290431022644043, 1.19245183467865, 1.2558605670928955, 1.3192692995071411, 1.3826780319213867, 1.4460868835449219, 1.5094956159591675, 1.572904348373413, 1.6363130807876587, 1.6997218132019043, 1.76313054561615, 1.8265392780303955, 1.8899481296539307, 1.9533567428588867, 2.016765594482422, 2.080174446105957, 2.143583059310913, 2.2069919109344482, 2.2704005241394043, 2.3338093757629395, 2.3972179889678955, 2.4606268405914307, 2.5240354537963867, 2.587444305419922, 2.650853157043457, 2.714262008666992, 2.7776706218719482, 2.8410794734954834, 2.9044880867004395, 2.9678969383239746, 3.0313055515289307, 3.094714403152466, 3.158123016357422]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 10.0, 13.0, 22.0, 22.0, 25.0, 43.0, 36.0, 56.0, 70.0, 90.0, 70.0, 83.0, 78.0, 75.0, 62.0, 57.0, 44.0, 30.0, 29.0, 15.0, 12.0, 10.0, 10.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349156975746155, -0.3195090889930725, -0.30410248041152954, -0.2886958718299866, -0.2732892632484436, -0.25788265466690063, -0.24247604608535767, -0.2270694375038147, -0.21166282892227173, -0.19625622034072876, -0.1808496117591858, -0.16544300317764282, -0.15003639459609985, -0.13462978601455688, -0.11922316998243332, -0.10381656140089035, -0.08840994536876678, -0.07300333678722382, -0.05759672820568085, -0.04219011589884758, -0.02678350731730461, -0.011376895010471344, 0.004029713571071625, 0.019436322152614594, 0.03484293073415756, 0.05024953931570053, 0.0656561478972435, 0.08106276392936707, 0.09646937251091003, 0.111875981092453, 0.12728258967399597, 0.14268919825553894, 0.1580958068370819, 0.17350241541862488, 0.18890902400016785, 0.20431563258171082, 0.21972224116325378, 0.23512884974479675, 0.2505354583263397, 0.2659420669078827, 0.28134867548942566, 0.29675528407096863, 0.3121618926525116, 0.32756850123405457, 0.34297510981559753, 0.3583817183971405, 0.37378832697868347, 0.38919493556022644, 0.4046015739440918, 0.42000818252563477, 0.43541479110717773, 0.4508213996887207, 0.46622800827026367, 0.48163461685180664, 0.4970412254333496, 0.5124478340148926, 0.5278544425964355, 0.5432610511779785, 0.5586676597595215, 0.5740742683410645, 0.5894808769226074, 0.6048874855041504, 0.6202940940856934, 0.6357007026672363, 0.6511073112487793]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 13.0, 14.0, 28.0, 31.0, 37.0, 47.0, 71.0, 83.0, 107.0, 135.0, 221.0, 237.0, 369.0, 428.0, 620.0, 795.0, 1071.0, 1373.0, 1957.0, 2729.0, 3981.0, 5776.0, 9028.0, 14686.0, 25925.0, 88531.0, 806472.0, 33025.0, 17521.0, 10430.0, 6715.0, 4458.0, 3181.0, 2224.0, 1598.0, 1173.0, 891.0, 626.0, 475.0, 326.0, 251.0, 226.0, 132.0, 142.0, 78.0, 73.0, 64.0, 41.0, 32.0, 35.0, 21.0, 17.0, 14.0, 6.0, 7.0, 5.0, 1.0, 3.0], "bins": [-0.422119140625, -0.40899658203125, -0.3958740234375, -0.38275146484375, -0.36962890625, -0.35650634765625, -0.3433837890625, -0.33026123046875, -0.317138671875, -0.30401611328125, -0.2908935546875, -0.27777099609375, -0.2646484375, -0.25152587890625, -0.2384033203125, -0.22528076171875, -0.212158203125, -0.19903564453125, -0.1859130859375, -0.17279052734375, -0.15966796875, -0.14654541015625, -0.1334228515625, -0.12030029296875, -0.107177734375, -0.09405517578125, -0.0809326171875, -0.06781005859375, -0.0546875, -0.04156494140625, -0.0284423828125, -0.01531982421875, -0.002197265625, 0.01092529296875, 0.0240478515625, 0.03717041015625, 0.05029296875, 0.06341552734375, 0.0765380859375, 0.08966064453125, 0.102783203125, 0.11590576171875, 0.1290283203125, 0.14215087890625, 0.1552734375, 0.16839599609375, 0.1815185546875, 0.19464111328125, 0.207763671875, 0.22088623046875, 0.2340087890625, 0.24713134765625, 0.26025390625, 0.27337646484375, 0.2864990234375, 0.29962158203125, 0.312744140625, 0.32586669921875, 0.3389892578125, 0.35211181640625, 0.365234375, 0.37835693359375, 0.3914794921875, 0.40460205078125, 0.417724609375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 13.0, 6.0, 10.0, 10.0, 11.0, 8.0, 52.0, 696.0, 44.0, 14.0, 20.0, 6.0, 5.0, 5.0, 6.0, 7.0, 11.0, 3.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12353515625, -0.1197500228881836, -0.11596488952636719, -0.11217975616455078, -0.10839462280273438, -0.10460948944091797, -0.10082435607910156, -0.09703922271728516, -0.09325408935546875, -0.08946895599365234, -0.08568382263183594, -0.08189868927001953, -0.07811355590820312, -0.07432842254638672, -0.07054328918457031, -0.0667581558227539, -0.0629730224609375, -0.059187889099121094, -0.05540275573730469, -0.05161762237548828, -0.047832489013671875, -0.04404735565185547, -0.04026222229003906, -0.036477088928222656, -0.03269195556640625, -0.028906822204589844, -0.025121688842773438, -0.02133655548095703, -0.017551422119140625, -0.013766288757324219, -0.009981155395507812, -0.006196022033691406, -0.002410888671875, 0.0013742446899414062, 0.0051593780517578125, 0.008944511413574219, 0.012729644775390625, 0.01651477813720703, 0.020299911499023438, 0.024085044860839844, 0.02787017822265625, 0.031655311584472656, 0.03544044494628906, 0.03922557830810547, 0.043010711669921875, 0.04679584503173828, 0.05058097839355469, 0.054366111755371094, 0.0581512451171875, 0.061936378479003906, 0.06572151184082031, 0.06950664520263672, 0.07329177856445312, 0.07707691192626953, 0.08086204528808594, 0.08464717864990234, 0.08843231201171875, 0.09221744537353516, 0.09600257873535156, 0.09978771209716797, 0.10357284545898438, 0.10735797882080078, 0.11114311218261719, 0.1149282455444336, 0.11871337890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 9.0, 11.0, 16.0, 21.0, 24.0, 41.0, 51.0, 71.0, 113.0, 136.0, 206.0, 288.0, 511.0, 922.0, 1795.0, 4271.0, 11152.0, 33080.0, 115840.0, 438113.0, 322489.0, 79765.0, 24062.0, 8390.0, 3319.0, 1604.0, 792.0, 460.0, 293.0, 213.0, 151.0, 107.0, 73.0, 52.0, 25.0, 28.0, 14.0, 12.0, 6.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.306640625, -0.2960166931152344, -0.28539276123046875, -0.2747688293457031, -0.2641448974609375, -0.2535209655761719, -0.24289703369140625, -0.23227310180664062, -0.221649169921875, -0.21102523803710938, -0.20040130615234375, -0.18977737426757812, -0.1791534423828125, -0.16852951049804688, -0.15790557861328125, -0.14728164672851562, -0.13665771484375, -0.12603378295898438, -0.11540985107421875, -0.10478591918945312, -0.0941619873046875, -0.08353805541992188, -0.07291412353515625, -0.062290191650390625, -0.051666259765625, -0.041042327880859375, -0.03041839599609375, -0.019794464111328125, -0.0091705322265625, 0.001453399658203125, 0.01207733154296875, 0.022701263427734375, 0.0333251953125, 0.043949127197265625, 0.05457305908203125, 0.06519699096679688, 0.0758209228515625, 0.08644485473632812, 0.09706878662109375, 0.10769271850585938, 0.118316650390625, 0.12894058227539062, 0.13956451416015625, 0.15018844604492188, 0.1608123779296875, 0.17143630981445312, 0.18206024169921875, 0.19268417358398438, 0.20330810546875, 0.21393203735351562, 0.22455596923828125, 0.23517990112304688, 0.2458038330078125, 0.2564277648925781, 0.26705169677734375, 0.2776756286621094, 0.288299560546875, 0.2989234924316406, 0.30954742431640625, 0.3201713562011719, 0.3307952880859375, 0.3414192199707031, 0.35204315185546875, 0.3626670837402344, 0.373291015625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 3.0, 10.0, 9.0, 6.0, 22.0, 13.0, 16.0, 23.0, 33.0, 28.0, 26.0, 48.0, 34.0, 34.0, 42.0, 43.0, 50.0, 59.0, 43.0, 37.0, 53.0, 55.0, 33.0, 35.0, 30.0, 14.0, 31.0, 26.0, 21.0, 22.0, 26.0, 9.0, 16.0, 17.0, 7.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.509063720703125, -0.49273681640625, -0.476409912109375, -0.4600830078125, -0.443756103515625, -0.42742919921875, -0.411102294921875, -0.394775390625, -0.378448486328125, -0.36212158203125, -0.345794677734375, -0.3294677734375, -0.313140869140625, -0.29681396484375, -0.280487060546875, -0.26416015625, -0.247833251953125, -0.23150634765625, -0.215179443359375, -0.1988525390625, -0.182525634765625, -0.16619873046875, -0.149871826171875, -0.133544921875, -0.117218017578125, -0.10089111328125, -0.084564208984375, -0.0682373046875, -0.051910400390625, -0.03558349609375, -0.019256591796875, -0.0029296875, 0.013397216796875, 0.02972412109375, 0.046051025390625, 0.0623779296875, 0.078704833984375, 0.09503173828125, 0.111358642578125, 0.127685546875, 0.144012451171875, 0.16033935546875, 0.176666259765625, 0.1929931640625, 0.209320068359375, 0.22564697265625, 0.241973876953125, 0.25830078125, 0.274627685546875, 0.29095458984375, 0.307281494140625, 0.3236083984375, 0.339935302734375, 0.35626220703125, 0.372589111328125, 0.388916015625, 0.405242919921875, 0.42156982421875, 0.437896728515625, 0.4542236328125, 0.470550537109375, 0.48687744140625, 0.503204345703125, 0.51953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 6.0, 8.0, 9.0, 10.0, 13.0, 20.0, 23.0, 40.0, 44.0, 92.0, 134.0, 237.0, 417.0, 969.0, 2410.0, 7379.0, 41362.0, 886662.0, 92219.0, 10769.0, 3291.0, 1244.0, 532.0, 246.0, 151.0, 71.0, 43.0, 38.0, 39.0, 25.0, 14.0, 11.0, 6.0, 10.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7265472412109375, -0.703582763671875, -0.6806182861328125, -0.65765380859375, -0.6346893310546875, -0.611724853515625, -0.5887603759765625, -0.5657958984375, -0.5428314208984375, -0.519866943359375, -0.4969024658203125, -0.47393798828125, -0.4509735107421875, -0.428009033203125, -0.4050445556640625, -0.382080078125, -0.3591156005859375, -0.336151123046875, -0.3131866455078125, -0.29022216796875, -0.2672576904296875, -0.244293212890625, -0.2213287353515625, -0.1983642578125, -0.1753997802734375, -0.152435302734375, -0.1294708251953125, -0.10650634765625, -0.0835418701171875, -0.060577392578125, -0.0376129150390625, -0.0146484375, 0.0083160400390625, 0.031280517578125, 0.0542449951171875, 0.07720947265625, 0.1001739501953125, 0.123138427734375, 0.1461029052734375, 0.1690673828125, 0.1920318603515625, 0.214996337890625, 0.2379608154296875, 0.26092529296875, 0.2838897705078125, 0.306854248046875, 0.3298187255859375, 0.352783203125, 0.3757476806640625, 0.398712158203125, 0.4216766357421875, 0.44464111328125, 0.4676055908203125, 0.490570068359375, 0.5135345458984375, 0.5364990234375, 0.5594635009765625, 0.582427978515625, 0.6053924560546875, 0.62835693359375, 0.6513214111328125, 0.674285888671875, 0.6972503662109375, 0.72021484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 13.0, 15.0, 14.0, 14.0, 29.0, 29.0, 53.0, 70.0, 97.0, 112.0, 102.0, 101.0, 87.0, 63.0, 44.0, 34.0, 31.0, 30.0, 13.0, 18.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.6684017181396484e-05, -5.446188151836395e-05, -5.223974585533142e-05, -5.001761019229889e-05, -4.779547452926636e-05, -4.5573338866233826e-05, -4.3351203203201294e-05, -4.112906754016876e-05, -3.890693187713623e-05, -3.66847962141037e-05, -3.446266055107117e-05, -3.2240524888038635e-05, -3.0018389225006104e-05, -2.7796253561973572e-05, -2.557411789894104e-05, -2.3351982235908508e-05, -2.1129846572875977e-05, -1.8907710909843445e-05, -1.6685575246810913e-05, -1.4463439583778381e-05, -1.224130392074585e-05, -1.0019168257713318e-05, -7.797032594680786e-06, -5.574896931648254e-06, -3.3527612686157227e-06, -1.130625605583191e-06, 1.0915100574493408e-06, 3.3136457204818726e-06, 5.535781383514404e-06, 7.757917046546936e-06, 9.980052709579468e-06, 1.2202188372612e-05, 1.4424324035644531e-05, 1.6646459698677063e-05, 1.8868595361709595e-05, 2.1090731024742126e-05, 2.3312866687774658e-05, 2.553500235080719e-05, 2.775713801383972e-05, 2.9979273676872253e-05, 3.2201409339904785e-05, 3.442354500293732e-05, 3.664568066596985e-05, 3.886781632900238e-05, 4.108995199203491e-05, 4.3312087655067444e-05, 4.5534223318099976e-05, 4.775635898113251e-05, 4.997849464416504e-05, 5.220063030719757e-05, 5.44227659702301e-05, 5.6644901633262634e-05, 5.8867037296295166e-05, 6.10891729593277e-05, 6.331130862236023e-05, 6.553344428539276e-05, 6.775557994842529e-05, 6.997771561145782e-05, 7.219985127449036e-05, 7.442198693752289e-05, 7.664412260055542e-05, 7.886625826358795e-05, 8.108839392662048e-05, 8.331052958965302e-05, 8.553266525268555e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 16.0, 20.0, 27.0, 45.0, 90.0, 122.0, 231.0, 445.0, 994.0, 3176.0, 12186.0, 87637.0, 812940.0, 110735.0, 13925.0, 3479.0, 1266.0, 551.0, 250.0, 143.0, 76.0, 54.0, 31.0, 25.0, 16.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.46096038818359375, -0.4453582763671875, -0.42975616455078125, -0.414154052734375, -0.39855194091796875, -0.3829498291015625, -0.36734771728515625, -0.35174560546875, -0.33614349365234375, -0.3205413818359375, -0.30493927001953125, -0.289337158203125, -0.27373504638671875, -0.2581329345703125, -0.24253082275390625, -0.2269287109375, -0.21132659912109375, -0.1957244873046875, -0.18012237548828125, -0.164520263671875, -0.14891815185546875, -0.1333160400390625, -0.11771392822265625, -0.10211181640625, -0.08650970458984375, -0.0709075927734375, -0.05530548095703125, -0.039703369140625, -0.02410125732421875, -0.0084991455078125, 0.00710296630859375, 0.022705078125, 0.03830718994140625, 0.0539093017578125, 0.06951141357421875, 0.085113525390625, 0.10071563720703125, 0.1163177490234375, 0.13191986083984375, 0.14752197265625, 0.16312408447265625, 0.1787261962890625, 0.19432830810546875, 0.209930419921875, 0.22553253173828125, 0.2411346435546875, 0.25673675537109375, 0.2723388671875, 0.28794097900390625, 0.3035430908203125, 0.31914520263671875, 0.334747314453125, 0.35034942626953125, 0.3659515380859375, 0.38155364990234375, 0.39715576171875, 0.41275787353515625, 0.4283599853515625, 0.44396209716796875, 0.459564208984375, 0.47516632080078125, 0.4907684326171875, 0.5063705444335938, 0.52197265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 9.0, 15.0, 21.0, 34.0, 47.0, 73.0, 76.0, 118.0, 136.0, 118.0, 102.0, 76.0, 54.0, 27.0, 19.0, 14.0, 12.0, 6.0, 6.0, 10.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6131668090820312, -0.5925445556640625, -0.5719223022460938, -0.551300048828125, -0.5306777954101562, -0.5100555419921875, -0.48943328857421875, -0.46881103515625, -0.44818878173828125, -0.4275665283203125, -0.40694427490234375, -0.386322021484375, -0.36569976806640625, -0.3450775146484375, -0.32445526123046875, -0.3038330078125, -0.28321075439453125, -0.2625885009765625, -0.24196624755859375, -0.221343994140625, -0.20072174072265625, -0.1800994873046875, -0.15947723388671875, -0.13885498046875, -0.11823272705078125, -0.0976104736328125, -0.07698822021484375, -0.056365966796875, -0.03574371337890625, -0.0151214599609375, 0.00550079345703125, 0.026123046875, 0.04674530029296875, 0.0673675537109375, 0.08798980712890625, 0.108612060546875, 0.12923431396484375, 0.1498565673828125, 0.17047882080078125, 0.19110107421875, 0.21172332763671875, 0.2323455810546875, 0.25296783447265625, 0.273590087890625, 0.29421234130859375, 0.3148345947265625, 0.33545684814453125, 0.3560791015625, 0.37670135498046875, 0.3973236083984375, 0.41794586181640625, 0.438568115234375, 0.45919036865234375, 0.4798126220703125, 0.5004348754882812, 0.52105712890625, 0.5416793823242188, 0.5623016357421875, 0.5829238891601562, 0.603546142578125, 0.6241683959960938, 0.6447906494140625, 0.6654129028320312, 0.68603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 3.0, 12.0, 7.0, 27.0, 114.0, 391.0, 315.0, 69.0, 30.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.18556022644043, -11.925686836242676, -11.665812492370605, -11.405939102172852, -11.146064758300781, -10.886191368103027, -10.626317977905273, -10.366443634033203, -10.10657024383545, -9.846696853637695, -9.586822509765625, -9.326949119567871, -9.0670747756958, -8.807201385498047, -8.547327041625977, -8.287453651428223, -8.027580261230469, -7.767706394195557, -7.5078325271606445, -7.247959136962891, -6.9880852699279785, -6.728211402893066, -6.468337535858154, -6.208463668823242, -5.948589324951172, -5.68871545791626, -5.428841590881348, -5.168968200683594, -4.909094333648682, -4.6492204666137695, -4.389346599578857, -4.129472732543945, -3.8695998191833496, -3.6097259521484375, -3.3498523235321045, -3.0899784564971924, -2.8301048278808594, -2.5702309608459473, -2.310357093811035, -2.050483226776123, -1.79060959815979, -1.5307358503341675, -1.270862102508545, -1.0109882354736328, -0.7511144876480103, -0.4912407398223877, -0.23136687278747559, 0.028506875038146973, 0.28838062286376953, 0.5482543706893921, 0.8081281781196594, 1.0680019855499268, 1.3278757333755493, 1.5877494812011719, 1.847623348236084, 2.107497215270996, 2.367370843887329, 2.627244710922241, 2.887118339538574, 3.1469922065734863, 3.4068660736083984, 3.6667397022247314, 3.9266135692596436, 4.186487197875977, 4.446361064910889]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 8.0, 15.0, 19.0, 12.0, 36.0, 63.0, 100.0, 106.0, 159.0, 138.0, 115.0, 68.0, 37.0, 21.0, 15.0, 9.0, 6.0, 4.0, 5.0, 3.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.108667373657227, -8.811705589294434, -8.514742851257324, -8.217781066894531, -7.92081880569458, -7.623856544494629, -7.326894760131836, -7.029932498931885, -6.732970237731934, -6.436007976531982, -6.1390461921691895, -5.842083930969238, -5.545121669769287, -5.248159408569336, -4.951197624206543, -4.654235363006592, -4.357273578643799, -4.060311317443848, -3.7633492946624756, -3.4663872718811035, -3.1694250106811523, -2.8724629878997803, -2.575500965118408, -2.278538703918457, -1.981576681137085, -1.6846145391464233, -1.3876523971557617, -1.0906903743743896, -0.793728232383728, -0.4967660903930664, -0.19980406761169434, 0.09715819358825684, 0.3941202163696289, 0.6910823583602905, 0.9880444407463074, 1.2850065231323242, 1.5819686651229858, 1.8789308071136475, 2.1758928298950195, 2.4728550910949707, 2.7698171138763428, 3.066779136657715, 3.363741397857666, 3.660703420639038, 3.95766544342041, 4.254627704620361, 4.5515899658203125, 4.8485517501831055, 5.145514011383057, 5.442476272583008, 5.739438056945801, 6.036400318145752, 6.333362579345703, 6.630324363708496, 6.927286624908447, 7.224248886108398, 7.521210670471191, 7.818172931671143, 8.115135192871094, 8.412096977233887, 8.70905876159668, 9.006021499633789, 9.302983283996582, 9.599945068359375, 9.896907806396484]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 11.0, 10.0, 12.0, 13.0, 24.0, 23.0, 34.0, 46.0, 72.0, 80.0, 101.0, 155.0, 224.0, 328.0, 448.0, 692.0, 1100.0, 1722.0, 3172.0, 5849.0, 14264.0, 52684.0, 3512929.0, 524048.0, 44905.0, 14708.0, 6866.0, 3562.0, 2232.0, 1361.0, 875.0, 555.0, 368.0, 251.0, 162.0, 140.0, 69.0, 58.0, 35.0, 33.0, 10.0, 12.0, 14.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0], "bins": [-1.1318359375, -1.1019744873046875, -1.072113037109375, -1.0422515869140625, -1.01239013671875, -0.9825286865234375, -0.952667236328125, -0.9228057861328125, -0.8929443359375, -0.8630828857421875, -0.833221435546875, -0.8033599853515625, -0.77349853515625, -0.7436370849609375, -0.713775634765625, -0.6839141845703125, -0.654052734375, -0.6241912841796875, -0.594329833984375, -0.5644683837890625, -0.53460693359375, -0.5047454833984375, -0.474884033203125, -0.4450225830078125, -0.4151611328125, -0.3852996826171875, -0.355438232421875, -0.3255767822265625, -0.29571533203125, -0.2658538818359375, -0.235992431640625, -0.2061309814453125, -0.17626953125, -0.1464080810546875, -0.116546630859375, -0.0866851806640625, -0.05682373046875, -0.0269622802734375, 0.002899169921875, 0.0327606201171875, 0.0626220703125, 0.0924835205078125, 0.122344970703125, 0.1522064208984375, 0.18206787109375, 0.2119293212890625, 0.241790771484375, 0.2716522216796875, 0.301513671875, 0.3313751220703125, 0.361236572265625, 0.3910980224609375, 0.42095947265625, 0.4508209228515625, 0.480682373046875, 0.5105438232421875, 0.5404052734375, 0.5702667236328125, 0.600128173828125, 0.6299896240234375, 0.65985107421875, 0.6897125244140625, 0.719573974609375, 0.7494354248046875, 0.779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 6.0, 12.0, 12.0, 19.0, 22.0, 54.0, 192.0, 355.0, 164.0, 36.0, 21.0, 7.0, 7.0, 10.0, 10.0, 8.0, 2.0, 3.0, 8.0, 6.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1473388671875, -0.14342117309570312, -0.13950347900390625, -0.13558578491210938, -0.1316680908203125, -0.12775039672851562, -0.12383270263671875, -0.11991500854492188, -0.115997314453125, -0.11207962036132812, -0.10816192626953125, -0.10424423217773438, -0.1003265380859375, -0.09640884399414062, -0.09249114990234375, -0.08857345581054688, -0.08465576171875, -0.08073806762695312, -0.07682037353515625, -0.07290267944335938, -0.0689849853515625, -0.06506729125976562, -0.06114959716796875, -0.057231903076171875, -0.053314208984375, -0.049396514892578125, -0.04547882080078125, -0.041561126708984375, -0.0376434326171875, -0.033725738525390625, -0.02980804443359375, -0.025890350341796875, -0.02197265625, -0.018054962158203125, -0.01413726806640625, -0.010219573974609375, -0.0063018798828125, -0.002384185791015625, 0.00153350830078125, 0.005451202392578125, 0.009368896484375, 0.013286590576171875, 0.01720428466796875, 0.021121978759765625, 0.0250396728515625, 0.028957366943359375, 0.03287506103515625, 0.036792755126953125, 0.04071044921875, 0.044628143310546875, 0.04854583740234375, 0.052463531494140625, 0.0563812255859375, 0.060298919677734375, 0.06421661376953125, 0.06813430786132812, 0.072052001953125, 0.07596969604492188, 0.07988739013671875, 0.08380508422851562, 0.0877227783203125, 0.09164047241210938, 0.09555816650390625, 0.09947586059570312, 0.1033935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 1.0, 10.0, 12.0, 11.0, 19.0, 20.0, 33.0, 56.0, 69.0, 122.0, 186.0, 333.0, 571.0, 1024.0, 2258.0, 5739.0, 18919.0, 108892.0, 3365410.0, 625314.0, 46345.0, 11059.0, 3871.0, 1784.0, 845.0, 503.0, 313.0, 211.0, 99.0, 59.0, 46.0, 46.0, 21.0, 21.0, 11.0, 10.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.44775390625, -0.4296875, -0.41162109375, -0.3935546875, -0.37548828125, -0.357421875, -0.33935546875, -0.3212890625, -0.30322265625, -0.28515625, -0.26708984375, -0.2490234375, -0.23095703125, -0.212890625, -0.19482421875, -0.1767578125, -0.15869140625, -0.140625, -0.12255859375, -0.1044921875, -0.08642578125, -0.068359375, -0.05029296875, -0.0322265625, -0.01416015625, 0.00390625, 0.02197265625, 0.0400390625, 0.05810546875, 0.076171875, 0.09423828125, 0.1123046875, 0.13037109375, 0.1484375, 0.16650390625, 0.1845703125, 0.20263671875, 0.220703125, 0.23876953125, 0.2568359375, 0.27490234375, 0.29296875, 0.31103515625, 0.3291015625, 0.34716796875, 0.365234375, 0.38330078125, 0.4013671875, 0.41943359375, 0.4375, 0.45556640625, 0.4736328125, 0.49169921875, 0.509765625, 0.52783203125, 0.5458984375, 0.56396484375, 0.58203125, 0.60009765625, 0.6181640625, 0.63623046875, 0.654296875, 0.67236328125, 0.6904296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 12.0, 19.0, 27.0, 26.0, 48.0, 107.0, 234.0, 527.0, 1598.0, 780.0, 282.0, 137.0, 82.0, 45.0, 30.0, 17.0, 20.0, 11.0, 11.0, 9.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.146240234375, -0.1413249969482422, -0.13640975952148438, -0.13149452209472656, -0.12657928466796875, -0.12166404724121094, -0.11674880981445312, -0.11183357238769531, -0.1069183349609375, -0.10200309753417969, -0.09708786010742188, -0.09217262268066406, -0.08725738525390625, -0.08234214782714844, -0.07742691040039062, -0.07251167297363281, -0.067596435546875, -0.06268119812011719, -0.057765960693359375, -0.05285072326660156, -0.04793548583984375, -0.04302024841308594, -0.038105010986328125, -0.03318977355957031, -0.0282745361328125, -0.023359298706054688, -0.018444061279296875, -0.013528823852539062, -0.00861358642578125, -0.0036983489990234375, 0.001216888427734375, 0.0061321258544921875, 0.01104736328125, 0.015962600708007812, 0.020877838134765625, 0.025793075561523438, 0.03070831298828125, 0.03562355041503906, 0.040538787841796875, 0.04545402526855469, 0.0503692626953125, 0.05528450012207031, 0.060199737548828125, 0.06511497497558594, 0.07003021240234375, 0.07494544982910156, 0.07986068725585938, 0.08477592468261719, 0.089691162109375, 0.09460639953613281, 0.09952163696289062, 0.10443687438964844, 0.10935211181640625, 0.11426734924316406, 0.11918258666992188, 0.12409782409667969, 0.1290130615234375, 0.1339282989501953, 0.13884353637695312, 0.14375877380371094, 0.14867401123046875, 0.15358924865722656, 0.15850448608398438, 0.1634197235107422, 0.1683349609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 17.0, 81.0, 394.0, 403.0, 65.0, 20.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.229240894317627, -1.1784467697143555, -1.127652645111084, -1.0768585205078125, -1.0260645151138306, -0.9752703905105591, -0.9244762659072876, -0.8736821413040161, -0.8228880763053894, -0.7720939517021179, -0.7212998867034912, -0.6705057621002197, -0.6197116374969482, -0.5689175724983215, -0.51812344789505, -0.46732935309410095, -0.41653525829315186, -0.36574116349220276, -0.31494706869125366, -0.2641529440879822, -0.21335884928703308, -0.16256475448608398, -0.1117706298828125, -0.0609765350818634, -0.010182440280914307, 0.04061166197061539, 0.09140576422214508, 0.14219987392425537, 0.19299396872520447, 0.24378806352615356, 0.29458218812942505, 0.34537628293037415, 0.39617037773132324, 0.44696447253227234, 0.49775856733322144, 0.5485526919364929, 0.5993467569351196, 0.6501408815383911, 0.7009350061416626, 0.7517291307449341, 0.8025231957435608, 0.8533173203468323, 0.904111385345459, 0.9549055099487305, 1.005699634552002, 1.0564937591552734, 1.107287883758545, 1.1580818891525269, 1.2088760137557983, 1.2596701383590698, 1.3104642629623413, 1.3612582683563232, 1.4120523929595947, 1.4628465175628662, 1.5136406421661377, 1.5644347667694092, 1.6152288913726807, 1.6660230159759521, 1.7168171405792236, 1.7676112651824951, 1.818405270576477, 1.8691993951797485, 1.91999351978302, 1.9707876443862915, 2.0215816497802734]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 9.0, 16.0, 6.0, 20.0, 32.0, 50.0, 49.0, 55.0, 88.0, 91.0, 102.0, 92.0, 92.0, 73.0, 54.0, 58.0, 20.0, 20.0, 22.0, 14.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8361510038375854, -0.8090371489524841, -0.7819233536720276, -0.7548094987869263, -0.727695643901825, -0.7005817890167236, -0.6734679937362671, -0.6463541388511658, -0.6192402839660645, -0.5921264290809631, -0.5650126338005066, -0.5378987789154053, -0.510784924030304, -0.483671098947525, -0.4565572738647461, -0.4294434189796448, -0.40232962369918823, -0.3752157986164093, -0.348101943731308, -0.32098811864852905, -0.29387426376342773, -0.2667604386806488, -0.23964661359786987, -0.21253277361392975, -0.18541893362998962, -0.1583050936460495, -0.13119125366210938, -0.10407742857933044, -0.07696358859539032, -0.049849748611450195, -0.022735923528671265, 0.00437791645526886, 0.03149169683456421, 0.058605533093214035, 0.08571936935186386, 0.11283320188522339, 0.1399470418691635, 0.16706088185310364, 0.19417470693588257, 0.2212885469198227, 0.24840238690376282, 0.27551621198654175, 0.30263006687164307, 0.329743891954422, 0.3568577170372009, 0.38397157192230225, 0.4110853970050812, 0.4381992220878601, 0.4653130769729614, 0.49242690205574036, 0.5195407271385193, 0.5466545820236206, 0.5737684369087219, 0.6008822917938232, 0.6279960870742798, 0.6551099419593811, 0.6822237968444824, 0.7093376517295837, 0.7364514470100403, 0.7635653018951416, 0.7906791567802429, 0.8177930116653442, 0.8449068069458008, 0.8720206618309021, 0.8991344571113586]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 12.0, 10.0, 17.0, 15.0, 32.0, 50.0, 86.0, 102.0, 136.0, 255.0, 383.0, 620.0, 1151.0, 2107.0, 4033.0, 8214.0, 18547.0, 56435.0, 761295.0, 146336.0, 26272.0, 10862.0, 5305.0, 2658.0, 1424.0, 824.0, 459.0, 323.0, 183.0, 120.0, 86.0, 63.0, 37.0, 29.0, 18.0, 14.0, 13.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7265625, -0.7050018310546875, -0.683441162109375, -0.6618804931640625, -0.64031982421875, -0.6187591552734375, -0.597198486328125, -0.5756378173828125, -0.5540771484375, -0.5325164794921875, -0.510955810546875, -0.4893951416015625, -0.46783447265625, -0.4462738037109375, -0.424713134765625, -0.4031524658203125, -0.381591796875, -0.3600311279296875, -0.338470458984375, -0.3169097900390625, -0.29534912109375, -0.2737884521484375, -0.252227783203125, -0.2306671142578125, -0.2091064453125, -0.1875457763671875, -0.165985107421875, -0.1444244384765625, -0.12286376953125, -0.1013031005859375, -0.079742431640625, -0.0581817626953125, -0.03662109375, -0.0150604248046875, 0.006500244140625, 0.0280609130859375, 0.04962158203125, 0.0711822509765625, 0.092742919921875, 0.1143035888671875, 0.1358642578125, 0.1574249267578125, 0.178985595703125, 0.2005462646484375, 0.22210693359375, 0.2436676025390625, 0.265228271484375, 0.2867889404296875, 0.308349609375, 0.3299102783203125, 0.351470947265625, 0.3730316162109375, 0.39459228515625, 0.4161529541015625, 0.437713623046875, 0.4592742919921875, 0.4808349609375, 0.5023956298828125, 0.523956298828125, 0.5455169677734375, 0.56707763671875, 0.5886383056640625, 0.610198974609375, 0.6317596435546875, 0.6533203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 5.0, 18.0, 18.0, 19.0, 35.0, 100.0, 223.0, 279.0, 134.0, 51.0, 14.0, 18.0, 10.0, 5.0, 10.0, 7.0, 9.0, 4.0, 5.0, 3.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.1454010009765625, -0.141510009765625, -0.1376190185546875, -0.13372802734375, -0.1298370361328125, -0.125946044921875, -0.1220550537109375, -0.1181640625, -0.1142730712890625, -0.110382080078125, -0.1064910888671875, -0.10260009765625, -0.0987091064453125, -0.094818115234375, -0.0909271240234375, -0.0870361328125, -0.0831451416015625, -0.079254150390625, -0.0753631591796875, -0.07147216796875, -0.0675811767578125, -0.063690185546875, -0.0597991943359375, -0.055908203125, -0.0520172119140625, -0.048126220703125, -0.0442352294921875, -0.04034423828125, -0.0364532470703125, -0.032562255859375, -0.0286712646484375, -0.0247802734375, -0.0208892822265625, -0.016998291015625, -0.0131072998046875, -0.00921630859375, -0.0053253173828125, -0.001434326171875, 0.0024566650390625, 0.00634765625, 0.0102386474609375, 0.014129638671875, 0.0180206298828125, 0.02191162109375, 0.0258026123046875, 0.029693603515625, 0.0335845947265625, 0.0374755859375, 0.0413665771484375, 0.045257568359375, 0.0491485595703125, 0.05303955078125, 0.0569305419921875, 0.060821533203125, 0.0647125244140625, 0.068603515625, 0.0724945068359375, 0.076385498046875, 0.0802764892578125, 0.08416748046875, 0.0880584716796875, 0.091949462890625, 0.0958404541015625, 0.0997314453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 17.0, 38.0, 62.0, 176.0, 467.0, 1540.0, 7630.0, 77468.0, 804403.0, 142914.0, 10891.0, 1990.0, 576.0, 183.0, 86.0, 48.0, 14.0, 12.0, 9.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.76025390625, -0.7361984252929688, -0.7121429443359375, -0.6880874633789062, -0.664031982421875, -0.6399765014648438, -0.6159210205078125, -0.5918655395507812, -0.56781005859375, -0.5437545776367188, -0.5196990966796875, -0.49564361572265625, -0.471588134765625, -0.44753265380859375, -0.4234771728515625, -0.39942169189453125, -0.3753662109375, -0.35131072998046875, -0.3272552490234375, -0.30319976806640625, -0.279144287109375, -0.25508880615234375, -0.2310333251953125, -0.20697784423828125, -0.18292236328125, -0.15886688232421875, -0.1348114013671875, -0.11075592041015625, -0.086700439453125, -0.06264495849609375, -0.0385894775390625, -0.01453399658203125, 0.009521484375, 0.03357696533203125, 0.0576324462890625, 0.08168792724609375, 0.105743408203125, 0.12979888916015625, 0.1538543701171875, 0.17790985107421875, 0.20196533203125, 0.22602081298828125, 0.2500762939453125, 0.27413177490234375, 0.298187255859375, 0.32224273681640625, 0.3462982177734375, 0.37035369873046875, 0.3944091796875, 0.41846466064453125, 0.4425201416015625, 0.46657562255859375, 0.490631103515625, 0.5146865844726562, 0.5387420654296875, 0.5627975463867188, 0.58685302734375, 0.6109085083007812, 0.6349639892578125, 0.6590194702148438, 0.683074951171875, 0.7071304321289062, 0.7311859130859375, 0.7552413940429688, 0.779296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 6.0, 9.0, 7.0, 7.0, 17.0, 17.0, 24.0, 32.0, 30.0, 29.0, 20.0, 34.0, 40.0, 34.0, 35.0, 37.0, 43.0, 39.0, 42.0, 53.0, 40.0, 48.0, 42.0, 37.0, 30.0, 34.0, 34.0, 28.0, 33.0, 23.0, 19.0, 9.0, 21.0, 7.0, 12.0, 8.0, 4.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.33090972900390625, -0.3207550048828125, -0.31060028076171875, -0.300445556640625, -0.29029083251953125, -0.2801361083984375, -0.26998138427734375, -0.25982666015625, -0.24967193603515625, -0.2395172119140625, -0.22936248779296875, -0.219207763671875, -0.20905303955078125, -0.1988983154296875, -0.18874359130859375, -0.1785888671875, -0.16843414306640625, -0.1582794189453125, -0.14812469482421875, -0.137969970703125, -0.12781524658203125, -0.1176605224609375, -0.10750579833984375, -0.09735107421875, -0.08719635009765625, -0.0770416259765625, -0.06688690185546875, -0.056732177734375, -0.04657745361328125, -0.0364227294921875, -0.02626800537109375, -0.01611328125, -0.00595855712890625, 0.0041961669921875, 0.01435089111328125, 0.024505615234375, 0.03466033935546875, 0.0448150634765625, 0.05496978759765625, 0.06512451171875, 0.07527923583984375, 0.0854339599609375, 0.09558868408203125, 0.105743408203125, 0.11589813232421875, 0.1260528564453125, 0.13620758056640625, 0.1463623046875, 0.15651702880859375, 0.1666717529296875, 0.17682647705078125, 0.186981201171875, 0.19713592529296875, 0.2072906494140625, 0.21744537353515625, 0.22760009765625, 0.23775482177734375, 0.2479095458984375, 0.25806427001953125, 0.268218994140625, 0.27837371826171875, 0.2885284423828125, 0.29868316650390625, 0.308837890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 8.0, 7.0, 16.0, 23.0, 39.0, 55.0, 78.0, 132.0, 220.0, 517.0, 1030.0, 2923.0, 13091.0, 270600.0, 733426.0, 20043.0, 3867.0, 1236.0, 554.0, 285.0, 157.0, 82.0, 53.0, 32.0, 18.0, 17.0, 8.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99169921875, -0.9564132690429688, -0.9211273193359375, -0.8858413696289062, -0.850555419921875, -0.8152694702148438, -0.7799835205078125, -0.7446975708007812, -0.70941162109375, -0.6741256713867188, -0.6388397216796875, -0.6035537719726562, -0.568267822265625, -0.5329818725585938, -0.4976959228515625, -0.46240997314453125, -0.4271240234375, -0.39183807373046875, -0.3565521240234375, -0.32126617431640625, -0.285980224609375, -0.25069427490234375, -0.2154083251953125, -0.18012237548828125, -0.14483642578125, -0.10955047607421875, -0.0742645263671875, -0.03897857666015625, -0.003692626953125, 0.03159332275390625, 0.0668792724609375, 0.10216522216796875, 0.137451171875, 0.17273712158203125, 0.2080230712890625, 0.24330902099609375, 0.278594970703125, 0.31388092041015625, 0.3491668701171875, 0.38445281982421875, 0.41973876953125, 0.45502471923828125, 0.4903106689453125, 0.5255966186523438, 0.560882568359375, 0.5961685180664062, 0.6314544677734375, 0.6667404174804688, 0.7020263671875, 0.7373123168945312, 0.7725982666015625, 0.8078842163085938, 0.843170166015625, 0.8784561157226562, 0.9137420654296875, 0.9490280151367188, 0.98431396484375, 1.0195999145507812, 1.0548858642578125, 1.0901718139648438, 1.125457763671875, 1.1607437133789062, 1.1960296630859375, 1.2313156127929688, 1.2666015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 4.0, 9.0, 13.0, 12.0, 19.0, 34.0, 64.0, 104.0, 139.0, 184.0, 159.0, 86.0, 53.0, 30.0, 31.0, 14.0, 13.0, 6.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019431114196777344, -0.0001881122589111328, -0.0001819133758544922, -0.00017571449279785156, -0.00016951560974121094, -0.0001633167266845703, -0.0001571178436279297, -0.00015091896057128906, -0.00014472007751464844, -0.0001385211944580078, -0.0001323223114013672, -0.00012612342834472656, -0.00011992454528808594, -0.00011372566223144531, -0.00010752677917480469, -0.00010132789611816406, -9.512901306152344e-05, -8.893013000488281e-05, -8.273124694824219e-05, -7.653236389160156e-05, -7.033348083496094e-05, -6.413459777832031e-05, -5.793571472167969e-05, -5.173683166503906e-05, -4.553794860839844e-05, -3.933906555175781e-05, -3.314018249511719e-05, -2.6941299438476562e-05, -2.0742416381835938e-05, -1.4543533325195312e-05, -8.344650268554688e-06, -2.1457672119140625e-06, 4.0531158447265625e-06, 1.0251998901367188e-05, 1.6450881958007812e-05, 2.2649765014648438e-05, 2.8848648071289062e-05, 3.504753112792969e-05, 4.124641418457031e-05, 4.744529724121094e-05, 5.364418029785156e-05, 5.984306335449219e-05, 6.604194641113281e-05, 7.224082946777344e-05, 7.843971252441406e-05, 8.463859558105469e-05, 9.083747863769531e-05, 9.703636169433594e-05, 0.00010323524475097656, 0.00010943412780761719, 0.00011563301086425781, 0.00012183189392089844, 0.00012803077697753906, 0.0001342296600341797, 0.0001404285430908203, 0.00014662742614746094, 0.00015282630920410156, 0.0001590251922607422, 0.0001652240753173828, 0.00017142295837402344, 0.00017762184143066406, 0.0001838207244873047, 0.0001900196075439453, 0.00019621849060058594, 0.00020241737365722656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 8.0, 3.0, 7.0, 14.0, 16.0, 28.0, 40.0, 50.0, 86.0, 165.0, 303.0, 617.0, 1578.0, 4605.0, 18589.0, 160209.0, 769605.0, 73949.0, 12342.0, 3543.0, 1334.0, 616.0, 335.0, 180.0, 99.0, 69.0, 48.0, 33.0, 24.0, 18.0, 6.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.48947906494140625, -0.4701690673828125, -0.45085906982421875, -0.431549072265625, -0.41223907470703125, -0.3929290771484375, -0.37361907958984375, -0.35430908203125, -0.33499908447265625, -0.3156890869140625, -0.29637908935546875, -0.277069091796875, -0.25775909423828125, -0.2384490966796875, -0.21913909912109375, -0.1998291015625, -0.18051910400390625, -0.1612091064453125, -0.14189910888671875, -0.122589111328125, -0.10327911376953125, -0.0839691162109375, -0.06465911865234375, -0.04534912109375, -0.02603912353515625, -0.0067291259765625, 0.01258087158203125, 0.031890869140625, 0.05120086669921875, 0.0705108642578125, 0.08982086181640625, 0.109130859375, 0.12844085693359375, 0.1477508544921875, 0.16706085205078125, 0.186370849609375, 0.20568084716796875, 0.2249908447265625, 0.24430084228515625, 0.26361083984375, 0.28292083740234375, 0.3022308349609375, 0.32154083251953125, 0.340850830078125, 0.36016082763671875, 0.3794708251953125, 0.39878082275390625, 0.4180908203125, 0.43740081787109375, 0.4567108154296875, 0.47602081298828125, 0.495330810546875, 0.5146408081054688, 0.5339508056640625, 0.5532608032226562, 0.57257080078125, 0.5918807983398438, 0.6111907958984375, 0.6305007934570312, 0.649810791015625, 0.6691207885742188, 0.6884307861328125, 0.7077407836914062, 0.72705078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 13.0, 10.0, 17.0, 29.0, 38.0, 33.0, 63.0, 91.0, 98.0, 103.0, 116.0, 88.0, 66.0, 47.0, 37.0, 29.0, 20.0, 14.0, 23.0, 8.0, 3.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.361083984375, -0.3465080261230469, -0.33193206787109375, -0.3173561096191406, -0.3027801513671875, -0.2882041931152344, -0.27362823486328125, -0.2590522766113281, -0.244476318359375, -0.22990036010742188, -0.21532440185546875, -0.20074844360351562, -0.1861724853515625, -0.17159652709960938, -0.15702056884765625, -0.14244461059570312, -0.12786865234375, -0.11329269409179688, -0.09871673583984375, -0.08414077758789062, -0.0695648193359375, -0.054988861083984375, -0.04041290283203125, -0.025836944580078125, -0.011260986328125, 0.003314971923828125, 0.01789093017578125, 0.032466888427734375, 0.0470428466796875, 0.061618804931640625, 0.07619476318359375, 0.09077072143554688, 0.1053466796875, 0.11992263793945312, 0.13449859619140625, 0.14907455444335938, 0.1636505126953125, 0.17822647094726562, 0.19280242919921875, 0.20737838745117188, 0.221954345703125, 0.23653030395507812, 0.25110626220703125, 0.2656822204589844, 0.2802581787109375, 0.2948341369628906, 0.30941009521484375, 0.3239860534667969, 0.33856201171875, 0.3531379699707031, 0.36771392822265625, 0.3822898864746094, 0.3968658447265625, 0.4114418029785156, 0.42601776123046875, 0.4405937194824219, 0.455169677734375, 0.4697456359863281, 0.48432159423828125, 0.4988975524902344, 0.5134735107421875, 0.5280494689941406, 0.5426254272460938, 0.5572013854980469, 0.57177734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 16.0, 88.0, 436.0, 381.0, 48.0, 13.0, 10.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.177377223968506, -6.9203948974609375, -6.663412094116211, -6.406429767608643, -6.149447441101074, -5.892464637756348, -5.635482311248779, -5.378499984741211, -5.121517181396484, -4.864534854888916, -4.6075520515441895, -4.350569725036621, -4.093587398529053, -3.8366048336029053, -3.579622268676758, -3.3226399421691895, -3.065657615661621, -2.8086750507354736, -2.5516927242279053, -2.294710159301758, -2.0377278327941895, -1.780745267868042, -1.5237627029418945, -1.2667802572250366, -1.0097978115081787, -0.7528153657913208, -0.4958328604698181, -0.23885035514831543, 0.01813209056854248, 0.2751145362854004, 0.5320971012115479, 0.7890795469284058, 1.0460624694824219, 1.3030449151992798, 1.5600273609161377, 1.8170099258422852, 2.0739922523498535, 2.330974817276001, 2.5879573822021484, 2.844939708709717, 3.1019222736358643, 3.3589048385620117, 3.61588716506958, 3.8728697299957275, 4.129852294921875, 4.386834621429443, 4.643816947937012, 4.900799751281738, 5.157782077789307, 5.414764404296875, 5.671747207641602, 5.92872953414917, 6.185711860656738, 6.442694664001465, 6.699676990509033, 6.956659317016602, 7.213642120361328, 7.4706244468688965, 7.727607250213623, 7.984589576721191, 8.241572380065918, 8.498554229736328, 8.755537033081055, 9.012519836425781, 9.269501686096191]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 7.0, 13.0, 24.0, 25.0, 52.0, 72.0, 76.0, 95.0, 111.0, 137.0, 93.0, 80.0, 58.0, 49.0, 24.0, 18.0, 11.0, 14.0, 3.0, 7.0, 5.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.342592239379883, -4.184720516204834, -4.026848793029785, -3.8689773082733154, -3.7111055850982666, -3.5532338619232178, -3.395362377166748, -3.237490653991699, -3.0796189308166504, -2.9217472076416016, -2.7638754844665527, -2.606003999710083, -2.448132276535034, -2.2902605533599854, -2.1323890686035156, -1.9745173454284668, -1.816645622253418, -1.6587738990783691, -1.5009022951126099, -1.3430306911468506, -1.1851589679718018, -1.027287244796753, -0.8694156408309937, -0.7115440368652344, -0.5536723136901855, -0.3958006501197815, -0.23792898654937744, -0.08005732297897339, 0.07781434059143066, 0.23568600416183472, 0.39355766773223877, 0.551429271697998, 0.7093014717102051, 0.8671731352806091, 1.0250447988510132, 1.1829164028167725, 1.3407881259918213, 1.4986598491668701, 1.6565314531326294, 1.8144030570983887, 1.9722747802734375, 2.1301465034484863, 2.288018226623535, 2.445889711380005, 2.6037614345550537, 2.7616331577301025, 2.9195046424865723, 3.077376365661621, 3.23524808883667, 3.3931198120117188, 3.5509915351867676, 3.7088630199432373, 3.866734743118286, 4.024606227874756, 4.182477951049805, 4.3403496742248535, 4.498221397399902, 4.656093120574951, 4.81396484375, 4.971836566925049, 5.129708290100098, 5.287579536437988, 5.445451259613037, 5.603322982788086, 5.761194705963135]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 2.0, 8.0, 9.0, 6.0, 14.0, 7.0, 8.0, 12.0, 13.0, 22.0, 18.0, 24.0, 28.0, 40.0, 57.0, 114.0, 138.0, 198.0, 318.0, 573.0, 1059.0, 2154.0, 6703.0, 45841.0, 4052735.0, 68540.0, 8644.0, 3020.0, 1545.0, 870.0, 554.0, 370.0, 210.0, 129.0, 92.0, 65.0, 44.0, 24.0, 20.0, 17.0, 15.0, 11.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.3250732421875, -2.261474609375, -2.1978759765625, -2.13427734375, -2.0706787109375, -2.007080078125, -1.9434814453125, -1.8798828125, -1.8162841796875, -1.752685546875, -1.6890869140625, -1.62548828125, -1.5618896484375, -1.498291015625, -1.4346923828125, -1.37109375, -1.3074951171875, -1.243896484375, -1.1802978515625, -1.11669921875, -1.0531005859375, -0.989501953125, -0.9259033203125, -0.8623046875, -0.7987060546875, -0.735107421875, -0.6715087890625, -0.60791015625, -0.5443115234375, -0.480712890625, -0.4171142578125, -0.353515625, -0.2899169921875, -0.226318359375, -0.1627197265625, -0.09912109375, -0.0355224609375, 0.028076171875, 0.0916748046875, 0.1552734375, 0.2188720703125, 0.282470703125, 0.3460693359375, 0.40966796875, 0.4732666015625, 0.536865234375, 0.6004638671875, 0.6640625, 0.7276611328125, 0.791259765625, 0.8548583984375, 0.91845703125, 0.9820556640625, 1.045654296875, 1.1092529296875, 1.1728515625, 1.2364501953125, 1.300048828125, 1.3636474609375, 1.42724609375, 1.4908447265625, 1.554443359375, 1.6180419921875, 1.681640625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 8.0, 18.0, 28.0, 58.0, 131.0, 248.0, 234.0, 114.0, 50.0, 25.0, 11.0, 9.0, 10.0, 11.0, 6.0, 5.0, 4.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1632080078125, -0.15892410278320312, -0.15464019775390625, -0.15035629272460938, -0.1460723876953125, -0.14178848266601562, -0.13750457763671875, -0.13322067260742188, -0.128936767578125, -0.12465286254882812, -0.12036895751953125, -0.11608505249023438, -0.1118011474609375, -0.10751724243164062, -0.10323333740234375, -0.09894943237304688, -0.09466552734375, -0.09038162231445312, -0.08609771728515625, -0.08181381225585938, -0.0775299072265625, -0.07324600219726562, -0.06896209716796875, -0.06467819213867188, -0.060394287109375, -0.056110382080078125, -0.05182647705078125, -0.047542572021484375, -0.0432586669921875, -0.038974761962890625, -0.03469085693359375, -0.030406951904296875, -0.026123046875, -0.021839141845703125, -0.01755523681640625, -0.013271331787109375, -0.0089874267578125, -0.004703521728515625, -0.00041961669921875, 0.003864288330078125, 0.008148193359375, 0.012432098388671875, 0.01671600341796875, 0.020999908447265625, 0.0252838134765625, 0.029567718505859375, 0.03385162353515625, 0.038135528564453125, 0.04241943359375, 0.046703338623046875, 0.05098724365234375, 0.055271148681640625, 0.0595550537109375, 0.06383895874023438, 0.06812286376953125, 0.07240676879882812, 0.076690673828125, 0.08097457885742188, 0.08525848388671875, 0.08954238891601562, 0.0938262939453125, 0.09811019897460938, 0.10239410400390625, 0.10667800903320312, 0.1109619140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 8.0, 20.0, 21.0, 42.0, 58.0, 149.0, 390.0, 1651.0, 12918.0, 3715095.0, 455434.0, 6872.0, 1037.0, 275.0, 90.0, 55.0, 34.0, 26.0, 18.0, 14.0, 6.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.58203125, -1.5272674560546875, -1.472503662109375, -1.4177398681640625, -1.36297607421875, -1.3082122802734375, -1.253448486328125, -1.1986846923828125, -1.1439208984375, -1.0891571044921875, -1.034393310546875, -0.9796295166015625, -0.92486572265625, -0.8701019287109375, -0.815338134765625, -0.7605743408203125, -0.705810546875, -0.6510467529296875, -0.596282958984375, -0.5415191650390625, -0.48675537109375, -0.4319915771484375, -0.377227783203125, -0.3224639892578125, -0.2677001953125, -0.2129364013671875, -0.158172607421875, -0.1034088134765625, -0.04864501953125, 0.0061187744140625, 0.060882568359375, 0.1156463623046875, 0.17041015625, 0.2251739501953125, 0.279937744140625, 0.3347015380859375, 0.38946533203125, 0.4442291259765625, 0.498992919921875, 0.5537567138671875, 0.6085205078125, 0.6632843017578125, 0.718048095703125, 0.7728118896484375, 0.82757568359375, 0.8823394775390625, 0.937103271484375, 0.9918670654296875, 1.046630859375, 1.1013946533203125, 1.156158447265625, 1.2109222412109375, 1.26568603515625, 1.3204498291015625, 1.375213623046875, 1.4299774169921875, 1.4847412109375, 1.5395050048828125, 1.594268798828125, 1.6490325927734375, 1.70379638671875, 1.7585601806640625, 1.813323974609375, 1.8680877685546875, 1.9228515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 19.0, 28.0, 27.0, 30.0, 52.0, 80.0, 147.0, 248.0, 524.0, 1424.0, 725.0, 294.0, 164.0, 96.0, 42.0, 28.0, 35.0, 15.0, 15.0, 8.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13720703125, -0.13335227966308594, -0.12949752807617188, -0.1256427764892578, -0.12178802490234375, -0.11793327331542969, -0.11407852172851562, -0.11022377014160156, -0.1063690185546875, -0.10251426696777344, -0.09865951538085938, -0.09480476379394531, -0.09095001220703125, -0.08709526062011719, -0.08324050903320312, -0.07938575744628906, -0.075531005859375, -0.07167625427246094, -0.06782150268554688, -0.06396675109863281, -0.06011199951171875, -0.05625724792480469, -0.052402496337890625, -0.04854774475097656, -0.0446929931640625, -0.04083824157714844, -0.036983489990234375, -0.03312873840332031, -0.02927398681640625, -0.025419235229492188, -0.021564483642578125, -0.017709732055664062, -0.01385498046875, -0.010000228881835938, -0.006145477294921875, -0.0022907257080078125, 0.00156402587890625, 0.0054187774658203125, 0.009273529052734375, 0.013128280639648438, 0.0169830322265625, 0.020837783813476562, 0.024692535400390625, 0.028547286987304688, 0.03240203857421875, 0.03625679016113281, 0.040111541748046875, 0.04396629333496094, 0.047821044921875, 0.05167579650878906, 0.055530548095703125, 0.05938529968261719, 0.06324005126953125, 0.06709480285644531, 0.07094955444335938, 0.07480430603027344, 0.0786590576171875, 0.08251380920410156, 0.08636856079101562, 0.09022331237792969, 0.09407806396484375, 0.09793281555175781, 0.10178756713867188, 0.10564231872558594, 0.1094970703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 11.0, 21.0, 100.0, 332.0, 404.0, 102.0, 22.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4085204601287842, -1.363159418106079, -1.317798376083374, -1.2724374532699585, -1.2270764112472534, -1.1817153692245483, -1.1363543272018433, -1.0909934043884277, -1.0456323623657227, -1.0002713203430176, -0.9549103379249573, -0.9095492959022522, -0.8641883134841919, -0.8188272714614868, -0.7734662294387817, -0.7281052470207214, -0.6827442049980164, -0.6373831629753113, -0.592022180557251, -0.5466611385345459, -0.5013001561164856, -0.4559391140937805, -0.4105781018733978, -0.36521708965301514, -0.31985607743263245, -0.27449506521224976, -0.22913405299186707, -0.18377302587032318, -0.1384120136499405, -0.0930510014295578, -0.047689974308013916, -0.0023289620876312256, 0.043032050132751465, 0.08839306235313416, 0.13375407457351685, 0.17911510169506073, 0.22447611391544342, 0.2698371410369873, 0.31519815325737, 0.3605591654777527, 0.4059201776981354, 0.45128118991851807, 0.49664220213890076, 0.5420032143592834, 0.5873642563819885, 0.6327252388000488, 0.6780862808227539, 0.723447322845459, 0.7688083052635193, 0.8141693472862244, 0.8595303297042847, 0.9048913717269897, 0.95025235414505, 0.9956133961677551, 1.0409743785858154, 1.0863354206085205, 1.1316964626312256, 1.1770575046539307, 1.2224185466766357, 1.2677794694900513, 1.3131405115127563, 1.3585015535354614, 1.4038625955581665, 1.449223518371582, 1.494584560394287]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 11.0, 19.0, 19.0, 41.0, 36.0, 28.0, 54.0, 55.0, 59.0, 62.0, 76.0, 69.0, 66.0, 63.0, 65.0, 58.0, 53.0, 28.0, 21.0, 25.0, 13.0, 14.0, 7.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.6968783736228943, -0.6789629459381104, -0.6610474586486816, -0.6431320309638977, -0.625216543674469, -0.6073011159896851, -0.5893856287002563, -0.5714702010154724, -0.5535547733306885, -0.5356393456459045, -0.5177238583564758, -0.4998084008693695, -0.4818929433822632, -0.46397751569747925, -0.4460620582103729, -0.4281466007232666, -0.4102311134338379, -0.39231565594673157, -0.37440019845962524, -0.3564847409725189, -0.3385692834854126, -0.32065385580062866, -0.30273839831352234, -0.284822940826416, -0.2669074833393097, -0.24899202585220337, -0.23107656836509705, -0.21316112577915192, -0.1952456682920456, -0.17733021080493927, -0.15941476821899414, -0.14149931073188782, -0.1235838532447815, -0.10566839575767517, -0.08775294572114944, -0.06983749568462372, -0.051922038197517395, -0.03400658071041107, -0.016091130673885345, 0.0018243193626403809, 0.019739776849746704, 0.03765523061156273, 0.055570684373378754, 0.07348613440990448, 0.0914015918970108, 0.10931704938411713, 0.12723249197006226, 0.14514794945716858, 0.1630634069442749, 0.18097886443138123, 0.19889432191848755, 0.21680976450443268, 0.234725221991539, 0.25264066457748413, 0.27055612206459045, 0.2884715795516968, 0.3063870370388031, 0.3243024945259094, 0.34221795201301575, 0.36013340950012207, 0.378048837184906, 0.3959643244743347, 0.41387975215911865, 0.431795209646225, 0.4497106671333313]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 14.0, 19.0, 30.0, 28.0, 51.0, 102.0, 169.0, 281.0, 522.0, 1119.0, 3155.0, 13213.0, 272523.0, 728066.0, 22177.0, 4185.0, 1431.0, 653.0, 316.0, 176.0, 113.0, 70.0, 39.0, 32.0, 13.0, 12.0, 3.0, 11.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9246444702148438, -0.8917694091796875, -0.8588943481445312, -0.826019287109375, -0.7931442260742188, -0.7602691650390625, -0.7273941040039062, -0.69451904296875, -0.6616439819335938, -0.6287689208984375, -0.5958938598632812, -0.563018798828125, -0.5301437377929688, -0.4972686767578125, -0.46439361572265625, -0.4315185546875, -0.39864349365234375, -0.3657684326171875, -0.33289337158203125, -0.300018310546875, -0.26714324951171875, -0.2342681884765625, -0.20139312744140625, -0.16851806640625, -0.13564300537109375, -0.1027679443359375, -0.06989288330078125, -0.037017822265625, -0.00414276123046875, 0.0287322998046875, 0.06160736083984375, 0.094482421875, 0.12735748291015625, 0.1602325439453125, 0.19310760498046875, 0.225982666015625, 0.25885772705078125, 0.2917327880859375, 0.32460784912109375, 0.35748291015625, 0.39035797119140625, 0.4232330322265625, 0.45610809326171875, 0.488983154296875, 0.5218582153320312, 0.5547332763671875, 0.5876083374023438, 0.6204833984375, 0.6533584594726562, 0.6862335205078125, 0.7191085815429688, 0.751983642578125, 0.7848587036132812, 0.8177337646484375, 0.8506088256835938, 0.88348388671875, 0.9163589477539062, 0.9492340087890625, 0.9821090698242188, 1.014984130859375, 1.0478591918945312, 1.0807342529296875, 1.1136093139648438, 1.146484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 11.0, 18.0, 52.0, 102.0, 191.0, 225.0, 176.0, 98.0, 49.0, 19.0, 15.0, 10.0, 6.0, 4.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15161991119384766, -0.1474781036376953, -0.14333629608154297, -0.13919448852539062, -0.13505268096923828, -0.13091087341308594, -0.1267690658569336, -0.12262725830078125, -0.1184854507446289, -0.11434364318847656, -0.11020183563232422, -0.10606002807617188, -0.10191822052001953, -0.09777641296386719, -0.09363460540771484, -0.0894927978515625, -0.08535099029541016, -0.08120918273925781, -0.07706737518310547, -0.07292556762695312, -0.06878376007080078, -0.06464195251464844, -0.060500144958496094, -0.05635833740234375, -0.052216529846191406, -0.04807472229003906, -0.04393291473388672, -0.039791107177734375, -0.03564929962158203, -0.03150749206542969, -0.027365684509277344, -0.023223876953125, -0.019082069396972656, -0.014940261840820312, -0.010798454284667969, -0.006656646728515625, -0.0025148391723632812, 0.0016269683837890625, 0.005768775939941406, 0.00991058349609375, 0.014052391052246094, 0.018194198608398438, 0.02233600616455078, 0.026477813720703125, 0.03061962127685547, 0.03476142883300781, 0.038903236389160156, 0.0430450439453125, 0.047186851501464844, 0.05132865905761719, 0.05547046661376953, 0.059612274169921875, 0.06375408172607422, 0.06789588928222656, 0.0720376968383789, 0.07617950439453125, 0.0803213119506836, 0.08446311950683594, 0.08860492706298828, 0.09274673461914062, 0.09688854217529297, 0.10103034973144531, 0.10517215728759766, 0.10931396484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 21.0, 17.0, 25.0, 40.0, 64.0, 87.0, 120.0, 183.0, 245.0, 463.0, 969.0, 2340.0, 6900.0, 26678.0, 151294.0, 621509.0, 192212.0, 32352.0, 7877.0, 2597.0, 1097.0, 514.0, 316.0, 202.0, 117.0, 89.0, 54.0, 46.0, 21.0, 28.0, 19.0, 8.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48779296875, -0.4723358154296875, -0.456878662109375, -0.4414215087890625, -0.42596435546875, -0.4105072021484375, -0.395050048828125, -0.3795928955078125, -0.3641357421875, -0.3486785888671875, -0.333221435546875, -0.3177642822265625, -0.30230712890625, -0.2868499755859375, -0.271392822265625, -0.2559356689453125, -0.240478515625, -0.2250213623046875, -0.209564208984375, -0.1941070556640625, -0.17864990234375, -0.1631927490234375, -0.147735595703125, -0.1322784423828125, -0.1168212890625, -0.1013641357421875, -0.085906982421875, -0.0704498291015625, -0.05499267578125, -0.0395355224609375, -0.024078369140625, -0.0086212158203125, 0.0068359375, 0.0222930908203125, 0.037750244140625, 0.0532073974609375, 0.06866455078125, 0.0841217041015625, 0.099578857421875, 0.1150360107421875, 0.1304931640625, 0.1459503173828125, 0.161407470703125, 0.1768646240234375, 0.19232177734375, 0.2077789306640625, 0.223236083984375, 0.2386932373046875, 0.254150390625, 0.2696075439453125, 0.285064697265625, 0.3005218505859375, 0.31597900390625, 0.3314361572265625, 0.346893310546875, 0.3623504638671875, 0.3778076171875, 0.3932647705078125, 0.408721923828125, 0.4241790771484375, 0.43963623046875, 0.4550933837890625, 0.470550537109375, 0.4860076904296875, 0.50146484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 10.0, 10.0, 8.0, 13.0, 18.0, 15.0, 20.0, 19.0, 27.0, 41.0, 39.0, 33.0, 46.0, 63.0, 54.0, 48.0, 54.0, 52.0, 61.0, 50.0, 42.0, 42.0, 37.0, 32.0, 25.0, 27.0, 17.0, 23.0, 8.0, 13.0, 11.0, 7.0, 6.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33544921875, -0.324310302734375, -0.31317138671875, -0.302032470703125, -0.2908935546875, -0.279754638671875, -0.26861572265625, -0.257476806640625, -0.246337890625, -0.235198974609375, -0.22406005859375, -0.212921142578125, -0.2017822265625, -0.190643310546875, -0.17950439453125, -0.168365478515625, -0.1572265625, -0.146087646484375, -0.13494873046875, -0.123809814453125, -0.1126708984375, -0.101531982421875, -0.09039306640625, -0.079254150390625, -0.068115234375, -0.056976318359375, -0.04583740234375, -0.034698486328125, -0.0235595703125, -0.012420654296875, -0.00128173828125, 0.009857177734375, 0.02099609375, 0.032135009765625, 0.04327392578125, 0.054412841796875, 0.0655517578125, 0.076690673828125, 0.08782958984375, 0.098968505859375, 0.110107421875, 0.121246337890625, 0.13238525390625, 0.143524169921875, 0.1546630859375, 0.165802001953125, 0.17694091796875, 0.188079833984375, 0.19921875, 0.210357666015625, 0.22149658203125, 0.232635498046875, 0.2437744140625, 0.254913330078125, 0.26605224609375, 0.277191162109375, 0.288330078125, 0.299468994140625, 0.31060791015625, 0.321746826171875, 0.3328857421875, 0.344024658203125, 0.35516357421875, 0.366302490234375, 0.37744140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 12.0, 23.0, 31.0, 46.0, 87.0, 114.0, 205.0, 489.0, 1186.0, 4336.0, 23151.0, 259922.0, 681340.0, 65290.0, 8715.0, 2122.0, 716.0, 311.0, 156.0, 105.0, 57.0, 40.0, 23.0, 19.0, 11.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.32488250732421875, -0.3148040771484375, -0.30472564697265625, -0.294647216796875, -0.28456878662109375, -0.2744903564453125, -0.26441192626953125, -0.25433349609375, -0.24425506591796875, -0.2341766357421875, -0.22409820556640625, -0.214019775390625, -0.20394134521484375, -0.1938629150390625, -0.18378448486328125, -0.1737060546875, -0.16362762451171875, -0.1535491943359375, -0.14347076416015625, -0.133392333984375, -0.12331390380859375, -0.1132354736328125, -0.10315704345703125, -0.09307861328125, -0.08300018310546875, -0.0729217529296875, -0.06284332275390625, -0.052764892578125, -0.04268646240234375, -0.0326080322265625, -0.02252960205078125, -0.012451171875, -0.00237274169921875, 0.0077056884765625, 0.01778411865234375, 0.027862548828125, 0.03794097900390625, 0.0480194091796875, 0.05809783935546875, 0.06817626953125, 0.07825469970703125, 0.0883331298828125, 0.09841156005859375, 0.108489990234375, 0.11856842041015625, 0.1286468505859375, 0.13872528076171875, 0.1488037109375, 0.15888214111328125, 0.1689605712890625, 0.17903900146484375, 0.189117431640625, 0.19919586181640625, 0.2092742919921875, 0.21935272216796875, 0.22943115234375, 0.23950958251953125, 0.2495880126953125, 0.25966644287109375, 0.269744873046875, 0.27982330322265625, 0.2899017333984375, 0.29998016357421875, 0.31005859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 5.0, 15.0, 15.0, 14.0, 32.0, 50.0, 50.0, 74.0, 134.0, 176.0, 140.0, 84.0, 55.0, 31.0, 35.0, 23.0, 24.0, 14.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002474784851074219, -0.00024164840579032898, -0.00023581832647323608, -0.0002299882471561432, -0.0002241581678390503, -0.0002183280885219574, -0.0002124980092048645, -0.0002066679298877716, -0.0002008378505706787, -0.00019500777125358582, -0.00018917769193649292, -0.00018334761261940002, -0.00017751753330230713, -0.00017168745398521423, -0.00016585737466812134, -0.00016002729535102844, -0.00015419721603393555, -0.00014836713671684265, -0.00014253705739974976, -0.00013670697808265686, -0.00013087689876556396, -0.00012504681944847107, -0.00011921674013137817, -0.00011338666081428528, -0.00010755658149719238, -0.00010172650218009949, -9.589642286300659e-05, -9.00663435459137e-05, -8.42362642288208e-05, -7.84061849117279e-05, -7.257610559463501e-05, -6.674602627754211e-05, -6.091594696044922e-05, -5.508586764335632e-05, -4.925578832626343e-05, -4.342570900917053e-05, -3.759562969207764e-05, -3.176555037498474e-05, -2.5935471057891846e-05, -2.010539174079895e-05, -1.4275312423706055e-05, -8.44523310661316e-06, -2.6151537895202637e-06, 3.214925527572632e-06, 9.045004844665527e-06, 1.4875084161758423e-05, 2.070516347885132e-05, 2.6535242795944214e-05, 3.236532211303711e-05, 3.8195401430130005e-05, 4.40254807472229e-05, 4.9855560064315796e-05, 5.568563938140869e-05, 6.151571869850159e-05, 6.734579801559448e-05, 7.317587733268738e-05, 7.900595664978027e-05, 8.483603596687317e-05, 9.066611528396606e-05, 9.649619460105896e-05, 0.00010232627391815186, 0.00010815635323524475, 0.00011398643255233765, 0.00011981651186943054, 0.00012564659118652344]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 1.0, 5.0, 7.0, 7.0, 14.0, 22.0, 26.0, 26.0, 35.0, 59.0, 73.0, 151.0, 235.0, 533.0, 1125.0, 3319.0, 13766.0, 92129.0, 688381.0, 215200.0, 25504.0, 5009.0, 1522.0, 600.0, 329.0, 155.0, 90.0, 66.0, 46.0, 25.0, 14.0, 18.0, 16.0, 12.0, 7.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33154296875, -0.3222503662109375, -0.312957763671875, -0.3036651611328125, -0.29437255859375, -0.2850799560546875, -0.275787353515625, -0.2664947509765625, -0.2572021484375, -0.2479095458984375, -0.238616943359375, -0.2293243408203125, -0.22003173828125, -0.2107391357421875, -0.201446533203125, -0.1921539306640625, -0.182861328125, -0.1735687255859375, -0.164276123046875, -0.1549835205078125, -0.14569091796875, -0.1363983154296875, -0.127105712890625, -0.1178131103515625, -0.1085205078125, -0.0992279052734375, -0.089935302734375, -0.0806427001953125, -0.07135009765625, -0.0620574951171875, -0.052764892578125, -0.0434722900390625, -0.0341796875, -0.0248870849609375, -0.015594482421875, -0.0063018798828125, 0.00299072265625, 0.0122833251953125, 0.021575927734375, 0.0308685302734375, 0.0401611328125, 0.0494537353515625, 0.058746337890625, 0.0680389404296875, 0.07733154296875, 0.0866241455078125, 0.095916748046875, 0.1052093505859375, 0.114501953125, 0.1237945556640625, 0.133087158203125, 0.1423797607421875, 0.15167236328125, 0.1609649658203125, 0.170257568359375, 0.1795501708984375, 0.1888427734375, 0.1981353759765625, 0.207427978515625, 0.2167205810546875, 0.22601318359375, 0.2353057861328125, 0.244598388671875, 0.2538909912109375, 0.26318359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 5.0, 13.0, 5.0, 9.0, 26.0, 33.0, 32.0, 42.0, 63.0, 66.0, 82.0, 97.0, 79.0, 93.0, 58.0, 70.0, 43.0, 43.0, 25.0, 27.0, 18.0, 12.0, 11.0, 7.0, 12.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.16072750091552734, -0.1564159393310547, -0.15210437774658203, -0.14779281616210938, -0.14348125457763672, -0.13916969299316406, -0.1348581314086914, -0.13054656982421875, -0.1262350082397461, -0.12192344665527344, -0.11761188507080078, -0.11330032348632812, -0.10898876190185547, -0.10467720031738281, -0.10036563873291016, -0.0960540771484375, -0.09174251556396484, -0.08743095397949219, -0.08311939239501953, -0.07880783081054688, -0.07449626922607422, -0.07018470764160156, -0.0658731460571289, -0.06156158447265625, -0.057250022888183594, -0.05293846130371094, -0.04862689971923828, -0.044315338134765625, -0.04000377655029297, -0.03569221496582031, -0.031380653381347656, -0.027069091796875, -0.022757530212402344, -0.018445968627929688, -0.014134407043457031, -0.009822845458984375, -0.005511283874511719, -0.0011997222900390625, 0.0031118392944335938, 0.00742340087890625, 0.011734962463378906, 0.016046524047851562, 0.02035808563232422, 0.024669647216796875, 0.02898120880126953, 0.03329277038574219, 0.037604331970214844, 0.0419158935546875, 0.046227455139160156, 0.05053901672363281, 0.05485057830810547, 0.059162139892578125, 0.06347370147705078, 0.06778526306152344, 0.0720968246459961, 0.07640838623046875, 0.0807199478149414, 0.08503150939941406, 0.08934307098388672, 0.09365463256835938, 0.09796619415283203, 0.10227775573730469, 0.10658931732177734, 0.11090087890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 6.0, 17.0, 32.0, 86.0, 286.0, 372.0, 137.0, 44.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6822969913482666, -3.4905805587768555, -3.2988638877868652, -3.107147216796875, -2.915430784225464, -2.7237143516540527, -2.5319976806640625, -2.3402810096740723, -2.148564577102661, -1.9568480253219604, -1.7651314735412598, -1.573414921760559, -1.3816983699798584, -1.1899818181991577, -0.998265266418457, -0.8065487146377563, -0.6148321628570557, -0.423115611076355, -0.2313990592956543, -0.03968250751495361, 0.15203404426574707, 0.34375059604644775, 0.5354671478271484, 0.7271836996078491, 0.9189002513885498, 1.1106168031692505, 1.3023333549499512, 1.4940499067306519, 1.6857664585113525, 1.8774830102920532, 2.069199562072754, 2.260916233062744, 2.4526329040527344, 2.6443495750427246, 2.8360660076141357, 3.027782440185547, 3.219499111175537, 3.4112157821655273, 3.6029322147369385, 3.7946486473083496, 3.98636531829834, 4.17808198928833, 4.36979866027832, 4.561514854431152, 4.753231525421143, 4.944948196411133, 5.136664390563965, 5.328381061553955, 5.520097732543945, 5.7118144035339355, 5.903531074523926, 6.095247268676758, 6.286963939666748, 6.478680610656738, 6.67039680480957, 6.8621134757995605, 7.053830146789551, 7.245546817779541, 7.437263488769531, 7.628979682922363, 7.8206963539123535, 8.012413024902344, 8.204129219055176, 8.395846366882324, 8.587562561035156]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 13.0, 17.0, 16.0, 22.0, 20.0, 30.0, 38.0, 46.0, 41.0, 49.0, 46.0, 49.0, 64.0, 68.0, 79.0, 39.0, 52.0, 58.0, 53.0, 41.0, 23.0, 26.0, 26.0, 20.0, 10.0, 11.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6003174781799316, -2.4959962368011475, -2.3916749954223633, -2.287353992462158, -2.183032751083374, -2.07871150970459, -1.9743902683258057, -1.8700690269470215, -1.7657477855682373, -1.6614265441894531, -1.5571054220199585, -1.4527841806411743, -1.3484629392623901, -1.2441418170928955, -1.1398205757141113, -1.0354993343353271, -0.9311782121658325, -0.8268570303916931, -0.7225357890129089, -0.6182146072387695, -0.5138933658599854, -0.40957218408584595, -0.30525100231170654, -0.20092976093292236, -0.09660857915878296, 0.007712624967098236, 0.11203382909297943, 0.21635502576828003, 0.3206762373447418, 0.4249974489212036, 0.529318630695343, 0.6336398720741272, 0.7379610538482666, 0.842282235622406, 0.9466034770011902, 1.0509246587753296, 1.1552459001541138, 1.2595670223236084, 1.3638882637023926, 1.4682095050811768, 1.572530746459961, 1.6768519878387451, 1.7811731100082397, 1.885494351387024, 1.989815592765808, 2.0941367149353027, 2.198457956314087, 2.302779197692871, 2.407100200653076, 2.5114214420318604, 2.6157426834106445, 2.7200636863708496, 2.824384927749634, 2.928706169128418, 3.033027410507202, 3.1373486518859863, 3.2416698932647705, 3.3459911346435547, 3.450312376022339, 3.554633617401123, 3.658954620361328, 3.7632758617401123, 3.8675971031188965, 3.9719183444976807, 4.076239585876465]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 22.0, 23.0, 42.0, 87.0, 182.0, 572.0, 4551.0, 4148468.0, 38198.0, 1498.0, 359.0, 119.0, 70.0, 34.0, 18.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.559326171875, -5.40380859375, -5.248291015625, -5.0927734375, -4.937255859375, -4.78173828125, -4.626220703125, -4.470703125, -4.315185546875, -4.15966796875, -4.004150390625, -3.8486328125, -3.693115234375, -3.53759765625, -3.382080078125, -3.2265625, -3.071044921875, -2.91552734375, -2.760009765625, -2.6044921875, -2.448974609375, -2.29345703125, -2.137939453125, -1.982421875, -1.826904296875, -1.67138671875, -1.515869140625, -1.3603515625, -1.204833984375, -1.04931640625, -0.893798828125, -0.73828125, -0.582763671875, -0.42724609375, -0.271728515625, -0.1162109375, 0.039306640625, 0.19482421875, 0.350341796875, 0.505859375, 0.661376953125, 0.81689453125, 0.972412109375, 1.1279296875, 1.283447265625, 1.43896484375, 1.594482421875, 1.75, 1.905517578125, 2.06103515625, 2.216552734375, 2.3720703125, 2.527587890625, 2.68310546875, 2.838623046875, 2.994140625, 3.149658203125, 3.30517578125, 3.460693359375, 3.6162109375, 3.771728515625, 3.92724609375, 4.082763671875, 4.23828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 17.0, 19.0, 36.0, 76.0, 109.0, 159.0, 161.0, 145.0, 107.0, 62.0, 43.0, 21.0, 19.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1905517578125, -0.1853351593017578, -0.18011856079101562, -0.17490196228027344, -0.16968536376953125, -0.16446876525878906, -0.15925216674804688, -0.1540355682373047, -0.1488189697265625, -0.1436023712158203, -0.13838577270507812, -0.13316917419433594, -0.12795257568359375, -0.12273597717285156, -0.11751937866210938, -0.11230278015136719, -0.107086181640625, -0.10186958312988281, -0.09665298461914062, -0.09143638610839844, -0.08621978759765625, -0.08100318908691406, -0.07578659057617188, -0.07056999206542969, -0.0653533935546875, -0.06013679504394531, -0.054920196533203125, -0.04970359802246094, -0.04448699951171875, -0.03927040100097656, -0.034053802490234375, -0.028837203979492188, -0.02362060546875, -0.018404006958007812, -0.013187408447265625, -0.007970809936523438, -0.00275421142578125, 0.0024623870849609375, 0.007678985595703125, 0.012895584106445312, 0.0181121826171875, 0.023328781127929688, 0.028545379638671875, 0.03376197814941406, 0.03897857666015625, 0.04419517517089844, 0.049411773681640625, 0.05462837219238281, 0.059844970703125, 0.06506156921386719, 0.07027816772460938, 0.07549476623535156, 0.08071136474609375, 0.08592796325683594, 0.09114456176757812, 0.09636116027832031, 0.1015777587890625, 0.10679435729980469, 0.11201095581054688, 0.11722755432128906, 0.12244415283203125, 0.12766075134277344, 0.13287734985351562, 0.1380939483642578, 0.143310546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 11.0, 17.0, 15.0, 11.0, 31.0, 41.0, 65.0, 88.0, 172.0, 320.0, 632.0, 2021.0, 8724.0, 84710.0, 3814387.0, 261276.0, 17020.0, 3038.0, 890.0, 384.0, 176.0, 98.0, 58.0, 36.0, 18.0, 13.0, 9.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.775390625, -0.7492446899414062, -0.7230987548828125, -0.6969528198242188, -0.670806884765625, -0.6446609497070312, -0.6185150146484375, -0.5923690795898438, -0.56622314453125, -0.5400772094726562, -0.5139312744140625, -0.48778533935546875, -0.461639404296875, -0.43549346923828125, -0.4093475341796875, -0.38320159912109375, -0.3570556640625, -0.33090972900390625, -0.3047637939453125, -0.27861785888671875, -0.252471923828125, -0.22632598876953125, -0.2001800537109375, -0.17403411865234375, -0.14788818359375, -0.12174224853515625, -0.0955963134765625, -0.06945037841796875, -0.043304443359375, -0.01715850830078125, 0.0089874267578125, 0.03513336181640625, 0.061279296875, 0.08742523193359375, 0.1135711669921875, 0.13971710205078125, 0.165863037109375, 0.19200897216796875, 0.2181549072265625, 0.24430084228515625, 0.27044677734375, 0.29659271240234375, 0.3227386474609375, 0.34888458251953125, 0.375030517578125, 0.40117645263671875, 0.4273223876953125, 0.45346832275390625, 0.4796142578125, 0.5057601928710938, 0.5319061279296875, 0.5580520629882812, 0.584197998046875, 0.6103439331054688, 0.6364898681640625, 0.6626358032226562, 0.68878173828125, 0.7149276733398438, 0.7410736083984375, 0.7672195434570312, 0.793365478515625, 0.8195114135742188, 0.8456573486328125, 0.8718032836914062, 0.89794921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 11.0, 18.0, 40.0, 56.0, 94.0, 167.0, 364.0, 1141.0, 1254.0, 431.0, 189.0, 95.0, 62.0, 37.0, 30.0, 18.0, 13.0, 15.0, 5.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.2185192108154297, -0.21291732788085938, -0.20731544494628906, -0.20171356201171875, -0.19611167907714844, -0.19050979614257812, -0.1849079132080078, -0.1793060302734375, -0.1737041473388672, -0.16810226440429688, -0.16250038146972656, -0.15689849853515625, -0.15129661560058594, -0.14569473266601562, -0.1400928497314453, -0.134490966796875, -0.1288890838623047, -0.12328720092773438, -0.11768531799316406, -0.11208343505859375, -0.10648155212402344, -0.10087966918945312, -0.09527778625488281, -0.0896759033203125, -0.08407402038574219, -0.07847213745117188, -0.07287025451660156, -0.06726837158203125, -0.06166648864746094, -0.056064605712890625, -0.05046272277832031, -0.04486083984375, -0.03925895690917969, -0.033657073974609375, -0.028055191040039062, -0.02245330810546875, -0.016851425170898438, -0.011249542236328125, -0.0056476593017578125, -4.57763671875e-05, 0.0055561065673828125, 0.011157989501953125, 0.016759872436523438, 0.02236175537109375, 0.027963638305664062, 0.033565521240234375, 0.03916740417480469, 0.044769287109375, 0.05037117004394531, 0.055973052978515625, 0.06157493591308594, 0.06717681884765625, 0.07277870178222656, 0.07838058471679688, 0.08398246765136719, 0.0895843505859375, 0.09518623352050781, 0.10078811645507812, 0.10638999938964844, 0.11199188232421875, 0.11759376525878906, 0.12319564819335938, 0.1287975311279297, 0.1343994140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 33.0, 117.0, 303.0, 340.0, 134.0, 35.0, 10.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0341618061065674, -1.988869547843933, -1.9435774087905884, -1.898285150527954, -1.8529930114746094, -1.807700753211975, -1.7624086141586304, -1.717116355895996, -1.6718242168426514, -1.626531958580017, -1.5812398195266724, -1.535947561264038, -1.4906554222106934, -1.445363163948059, -1.4000710248947144, -1.35477876663208, -1.3094866275787354, -1.264194369316101, -1.2189022302627563, -1.173609972000122, -1.1283178329467773, -1.083025574684143, -1.0377334356307983, -0.9924411773681641, -0.9471489191055298, -0.9018567204475403, -0.8565645217895508, -0.8112723231315613, -0.7659801244735718, -0.7206879258155823, -0.6753957271575928, -0.6301034688949585, -0.5848113298416138, -0.5395191311836243, -0.49422693252563477, -0.44893473386764526, -0.40364253520965576, -0.35835033655166626, -0.31305810809135437, -0.26776590943336487, -0.22247371077537537, -0.17718151211738586, -0.13188931345939636, -0.08659709990024567, -0.041304901242256165, 0.003987297415733337, 0.04927951097488403, 0.09457170963287354, 0.13986390829086304, 0.18515610694885254, 0.23044830560684204, 0.27574050426483154, 0.32103270292282104, 0.36632490158081055, 0.41161713004112244, 0.45690932869911194, 0.5022015571594238, 0.5474937558174133, 0.5927859544754028, 0.6380781531333923, 0.6833703517913818, 0.7286625504493713, 0.7739547491073608, 0.8192470073699951, 0.8645391464233398]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 10.0, 11.0, 28.0, 16.0, 22.0, 41.0, 42.0, 34.0, 34.0, 45.0, 48.0, 49.0, 51.0, 49.0, 60.0, 57.0, 54.0, 55.0, 38.0, 44.0, 29.0, 31.0, 21.0, 21.0, 19.0, 12.0, 14.0, 12.0, 9.0, 1.0, 7.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5313940644264221, -0.5143440961837769, -0.4972941279411316, -0.4802441895008087, -0.46319422125816345, -0.4461442530155182, -0.4290943145751953, -0.41204434633255005, -0.3949943780899048, -0.3779444098472595, -0.36089444160461426, -0.3438445031642914, -0.3267945349216461, -0.30974456667900085, -0.292694628238678, -0.2756446599960327, -0.25859469175338745, -0.2415447235107422, -0.22449477016925812, -0.20744481682777405, -0.19039484858512878, -0.17334488034248352, -0.15629492700099945, -0.13924497365951538, -0.12219500541687012, -0.10514504462480545, -0.08809508383274078, -0.07104512304067612, -0.05399516224861145, -0.03694520145654678, -0.019895240664482117, -0.00284527987241745, 0.014204680919647217, 0.031254641711711884, 0.04830460250377655, 0.06535456329584122, 0.08240452408790588, 0.09945448487997055, 0.11650444567203522, 0.1335543990135193, 0.15060436725616455, 0.16765433549880981, 0.18470428884029388, 0.20175424218177795, 0.21880421042442322, 0.23585417866706848, 0.25290411710739136, 0.2699540853500366, 0.2870040535926819, 0.30405402183532715, 0.3211039900779724, 0.3381539285182953, 0.35520389676094055, 0.3722538650035858, 0.3893038034439087, 0.40635377168655396, 0.4234037399291992, 0.4404537081718445, 0.45750367641448975, 0.4745536148548126, 0.4916035830974579, 0.5086535215377808, 0.525703489780426, 0.5427534580230713, 0.5598034262657166]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 12.0, 17.0, 25.0, 39.0, 72.0, 144.0, 209.0, 439.0, 1016.0, 2747.0, 12341.0, 316963.0, 687017.0, 21328.0, 3704.0, 1293.0, 566.0, 259.0, 116.0, 78.0, 54.0, 25.0, 25.0, 11.0, 11.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.094818115234375, -1.06072998046875, -1.026641845703125, -0.9925537109375, -0.958465576171875, -0.92437744140625, -0.890289306640625, -0.856201171875, -0.822113037109375, -0.78802490234375, -0.753936767578125, -0.7198486328125, -0.685760498046875, -0.65167236328125, -0.617584228515625, -0.58349609375, -0.549407958984375, -0.51531982421875, -0.481231689453125, -0.4471435546875, -0.413055419921875, -0.37896728515625, -0.344879150390625, -0.310791015625, -0.276702880859375, -0.24261474609375, -0.208526611328125, -0.1744384765625, -0.140350341796875, -0.10626220703125, -0.072174072265625, -0.0380859375, -0.003997802734375, 0.03009033203125, 0.064178466796875, 0.0982666015625, 0.132354736328125, 0.16644287109375, 0.200531005859375, 0.234619140625, 0.268707275390625, 0.30279541015625, 0.336883544921875, 0.3709716796875, 0.405059814453125, 0.43914794921875, 0.473236083984375, 0.50732421875, 0.541412353515625, 0.57550048828125, 0.609588623046875, 0.6436767578125, 0.677764892578125, 0.71185302734375, 0.745941162109375, 0.780029296875, 0.814117431640625, 0.84820556640625, 0.882293701171875, 0.9163818359375, 0.950469970703125, 0.98455810546875, 1.018646240234375, 1.052734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 18.0, 39.0, 77.0, 104.0, 147.0, 193.0, 141.0, 106.0, 68.0, 40.0, 30.0, 10.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.191162109375, -0.18593978881835938, -0.18071746826171875, -0.17549514770507812, -0.1702728271484375, -0.16505050659179688, -0.15982818603515625, -0.15460586547851562, -0.149383544921875, -0.14416122436523438, -0.13893890380859375, -0.13371658325195312, -0.1284942626953125, -0.12327194213867188, -0.11804962158203125, -0.11282730102539062, -0.10760498046875, -0.10238265991210938, -0.09716033935546875, -0.09193801879882812, -0.0867156982421875, -0.08149337768554688, -0.07627105712890625, -0.07104873657226562, -0.065826416015625, -0.060604095458984375, -0.05538177490234375, -0.050159454345703125, -0.0449371337890625, -0.039714813232421875, -0.03449249267578125, -0.029270172119140625, -0.0240478515625, -0.018825531005859375, -0.01360321044921875, -0.008380889892578125, -0.0031585693359375, 0.002063751220703125, 0.00728607177734375, 0.012508392333984375, 0.017730712890625, 0.022953033447265625, 0.02817535400390625, 0.033397674560546875, 0.0386199951171875, 0.043842315673828125, 0.04906463623046875, 0.054286956787109375, 0.05950927734375, 0.06473159790039062, 0.06995391845703125, 0.07517623901367188, 0.0803985595703125, 0.08562088012695312, 0.09084320068359375, 0.09606552124023438, 0.101287841796875, 0.10651016235351562, 0.11173248291015625, 0.11695480346679688, 0.1221771240234375, 0.12739944458007812, 0.13262176513671875, 0.13784408569335938, 0.14306640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 13.0, 11.0, 13.0, 22.0, 28.0, 46.0, 75.0, 135.0, 165.0, 292.0, 519.0, 1021.0, 2325.0, 6574.0, 22683.0, 108009.0, 539969.0, 297058.0, 49870.0, 12417.0, 3958.0, 1530.0, 761.0, 378.0, 234.0, 133.0, 87.0, 78.0, 51.0, 33.0, 24.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4049415588378906, -0.38922882080078125, -0.3735160827636719, -0.3578033447265625, -0.3420906066894531, -0.32637786865234375, -0.3106651306152344, -0.294952392578125, -0.2792396545410156, -0.26352691650390625, -0.24781417846679688, -0.2321014404296875, -0.21638870239257812, -0.20067596435546875, -0.18496322631835938, -0.16925048828125, -0.15353775024414062, -0.13782501220703125, -0.12211227416992188, -0.1063995361328125, -0.09068679809570312, -0.07497406005859375, -0.059261322021484375, -0.043548583984375, -0.027835845947265625, -0.01212310791015625, 0.003589630126953125, 0.0193023681640625, 0.035015106201171875, 0.05072784423828125, 0.06644058227539062, 0.0821533203125, 0.09786605834960938, 0.11357879638671875, 0.12929153442382812, 0.1450042724609375, 0.16071701049804688, 0.17642974853515625, 0.19214248657226562, 0.207855224609375, 0.22356796264648438, 0.23928070068359375, 0.2549934387207031, 0.2707061767578125, 0.2864189147949219, 0.30213165283203125, 0.3178443908691406, 0.33355712890625, 0.3492698669433594, 0.36498260498046875, 0.3806953430175781, 0.3964080810546875, 0.4121208190917969, 0.42783355712890625, 0.4435462951660156, 0.459259033203125, 0.4749717712402344, 0.49068450927734375, 0.5063972473144531, 0.5221099853515625, 0.5378227233886719, 0.5535354614257812, 0.5692481994628906, 0.5849609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 15.0, 20.0, 13.0, 24.0, 23.0, 35.0, 39.0, 53.0, 42.0, 57.0, 51.0, 70.0, 66.0, 66.0, 51.0, 62.0, 59.0, 41.0, 47.0, 28.0, 25.0, 19.0, 19.0, 12.0, 15.0, 14.0, 9.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423828125, -0.40727996826171875, -0.3907318115234375, -0.37418365478515625, -0.357635498046875, -0.34108734130859375, -0.3245391845703125, -0.30799102783203125, -0.29144287109375, -0.27489471435546875, -0.2583465576171875, -0.24179840087890625, -0.225250244140625, -0.20870208740234375, -0.1921539306640625, -0.17560577392578125, -0.1590576171875, -0.14250946044921875, -0.1259613037109375, -0.10941314697265625, -0.092864990234375, -0.07631683349609375, -0.0597686767578125, -0.04322052001953125, -0.02667236328125, -0.01012420654296875, 0.0064239501953125, 0.02297210693359375, 0.039520263671875, 0.05606842041015625, 0.0726165771484375, 0.08916473388671875, 0.105712890625, 0.12226104736328125, 0.1388092041015625, 0.15535736083984375, 0.171905517578125, 0.18845367431640625, 0.2050018310546875, 0.22154998779296875, 0.23809814453125, 0.25464630126953125, 0.2711944580078125, 0.28774261474609375, 0.304290771484375, 0.32083892822265625, 0.3373870849609375, 0.35393524169921875, 0.3704833984375, 0.38703155517578125, 0.4035797119140625, 0.42012786865234375, 0.436676025390625, 0.45322418212890625, 0.4697723388671875, 0.48632049560546875, 0.50286865234375, 0.5194168090820312, 0.5359649658203125, 0.5525131225585938, 0.569061279296875, 0.5856094360351562, 0.6021575927734375, 0.6187057495117188, 0.63525390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 13.0, 17.0, 22.0, 43.0, 59.0, 122.0, 325.0, 965.0, 4850.0, 73843.0, 813265.0, 145028.0, 7971.0, 1312.0, 373.0, 167.0, 73.0, 35.0, 24.0, 15.0, 8.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3955078125, -0.3849906921386719, -0.37447357177734375, -0.3639564514160156, -0.3534393310546875, -0.3429222106933594, -0.33240509033203125, -0.3218879699707031, -0.311370849609375, -0.3008537292480469, -0.29033660888671875, -0.2798194885253906, -0.2693023681640625, -0.2587852478027344, -0.24826812744140625, -0.23775100708007812, -0.22723388671875, -0.21671676635742188, -0.20619964599609375, -0.19568252563476562, -0.1851654052734375, -0.17464828491210938, -0.16413116455078125, -0.15361404418945312, -0.143096923828125, -0.13257980346679688, -0.12206268310546875, -0.11154556274414062, -0.1010284423828125, -0.09051132202148438, -0.07999420166015625, -0.06947708129882812, -0.0589599609375, -0.048442840576171875, -0.03792572021484375, -0.027408599853515625, -0.0168914794921875, -0.006374359130859375, 0.00414276123046875, 0.014659881591796875, 0.025177001953125, 0.035694122314453125, 0.04621124267578125, 0.056728363037109375, 0.0672454833984375, 0.07776260375976562, 0.08827972412109375, 0.09879684448242188, 0.10931396484375, 0.11983108520507812, 0.13034820556640625, 0.14086532592773438, 0.1513824462890625, 0.16189956665039062, 0.17241668701171875, 0.18293380737304688, 0.193450927734375, 0.20396804809570312, 0.21448516845703125, 0.22500228881835938, 0.2355194091796875, 0.24603652954101562, 0.25655364990234375, 0.2670707702636719, 0.277587890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 13.0, 7.0, 16.0, 14.0, 19.0, 20.0, 39.0, 37.0, 53.0, 84.0, 180.0, 170.0, 118.0, 59.0, 40.0, 34.0, 27.0, 13.0, 19.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011676549911499023, -0.00011171307414770126, -0.00010666064918041229, -0.00010160822421312332, -9.655579924583435e-05, -9.150337427854538e-05, -8.645094931125641e-05, -8.139852434396744e-05, -7.634609937667847e-05, -7.12936744093895e-05, -6.624124944210052e-05, -6.118882447481155e-05, -5.613639950752258e-05, -5.108397454023361e-05, -4.603154957294464e-05, -4.097912460565567e-05, -3.59266996383667e-05, -3.087427467107773e-05, -2.5821849703788757e-05, -2.0769424736499786e-05, -1.5716999769210815e-05, -1.0664574801921844e-05, -5.6121498346328735e-06, -5.597248673439026e-07, 4.492700099945068e-06, 9.54512506723404e-06, 1.459755003452301e-05, 1.964997500181198e-05, 2.4702399969100952e-05, 2.9754824936389923e-05, 3.4807249903678894e-05, 3.9859674870967865e-05, 4.4912099838256836e-05, 4.996452480554581e-05, 5.501694977283478e-05, 6.006937474012375e-05, 6.512179970741272e-05, 7.017422467470169e-05, 7.522664964199066e-05, 8.027907460927963e-05, 8.53314995765686e-05, 9.038392454385757e-05, 9.543634951114655e-05, 0.00010048877447843552, 0.00010554119944572449, 0.00011059362441301346, 0.00011564604938030243, 0.0001206984743475914, 0.00012575089931488037, 0.00013080332428216934, 0.0001358557492494583, 0.00014090817421674728, 0.00014596059918403625, 0.00015101302415132523, 0.0001560654491186142, 0.00016111787408590317, 0.00016617029905319214, 0.0001712227240204811, 0.00017627514898777008, 0.00018132757395505905, 0.00018637999892234802, 0.000191432423889637, 0.00019648484885692596, 0.00020153727382421494, 0.0002065896987915039]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 7.0, 6.0, 18.0, 20.0, 40.0, 33.0, 53.0, 67.0, 117.0, 161.0, 280.0, 462.0, 925.0, 2056.0, 5391.0, 19134.0, 91749.0, 444680.0, 381367.0, 76843.0, 16530.0, 4798.0, 1775.0, 797.0, 430.0, 263.0, 201.0, 90.0, 73.0, 45.0, 33.0, 19.0, 18.0, 14.0, 11.0, 7.0, 3.0, 3.0, 5.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1976318359375, -0.1916332244873047, -0.18563461303710938, -0.17963600158691406, -0.17363739013671875, -0.16763877868652344, -0.16164016723632812, -0.1556415557861328, -0.1496429443359375, -0.1436443328857422, -0.13764572143554688, -0.13164710998535156, -0.12564849853515625, -0.11964988708496094, -0.11365127563476562, -0.10765266418457031, -0.101654052734375, -0.09565544128417969, -0.08965682983398438, -0.08365821838378906, -0.07765960693359375, -0.07166099548339844, -0.06566238403320312, -0.05966377258300781, -0.0536651611328125, -0.04766654968261719, -0.041667938232421875, -0.03566932678222656, -0.02967071533203125, -0.023672103881835938, -0.017673492431640625, -0.011674880981445312, -0.00567626953125, 0.0003223419189453125, 0.006320953369140625, 0.012319564819335938, 0.01831817626953125, 0.024316787719726562, 0.030315399169921875, 0.03631401062011719, 0.0423126220703125, 0.04831123352050781, 0.054309844970703125, 0.06030845642089844, 0.06630706787109375, 0.07230567932128906, 0.07830429077148438, 0.08430290222167969, 0.090301513671875, 0.09630012512207031, 0.10229873657226562, 0.10829734802246094, 0.11429595947265625, 0.12029457092285156, 0.12629318237304688, 0.1322917938232422, 0.1382904052734375, 0.1442890167236328, 0.15028762817382812, 0.15628623962402344, 0.16228485107421875, 0.16828346252441406, 0.17428207397460938, 0.1802806854248047, 0.186279296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 14.0, 10.0, 10.0, 21.0, 28.0, 29.0, 34.0, 55.0, 63.0, 77.0, 76.0, 97.0, 110.0, 93.0, 75.0, 55.0, 36.0, 22.0, 23.0, 19.0, 12.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19873046875, -0.19358444213867188, -0.18843841552734375, -0.18329238891601562, -0.1781463623046875, -0.17300033569335938, -0.16785430908203125, -0.16270828247070312, -0.157562255859375, -0.15241622924804688, -0.14727020263671875, -0.14212417602539062, -0.1369781494140625, -0.13183212280273438, -0.12668609619140625, -0.12154006958007812, -0.11639404296875, -0.11124801635742188, -0.10610198974609375, -0.10095596313476562, -0.0958099365234375, -0.09066390991210938, -0.08551788330078125, -0.08037185668945312, -0.075225830078125, -0.07007980346679688, -0.06493377685546875, -0.059787750244140625, -0.0546417236328125, -0.049495697021484375, -0.04434967041015625, -0.039203643798828125, -0.0340576171875, -0.028911590576171875, -0.02376556396484375, -0.018619537353515625, -0.0134735107421875, -0.008327484130859375, -0.00318145751953125, 0.001964569091796875, 0.007110595703125, 0.012256622314453125, 0.01740264892578125, 0.022548675537109375, 0.0276947021484375, 0.032840728759765625, 0.03798675537109375, 0.043132781982421875, 0.04827880859375, 0.053424835205078125, 0.05857086181640625, 0.06371688842773438, 0.0688629150390625, 0.07400894165039062, 0.07915496826171875, 0.08430099487304688, 0.089447021484375, 0.09459304809570312, 0.09973907470703125, 0.10488510131835938, 0.1100311279296875, 0.11517715454101562, 0.12032318115234375, 0.12546920776367188, 0.130615234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 12.0, 11.0, 22.0, 41.0, 84.0, 185.0, 276.0, 200.0, 83.0, 44.0, 19.0, 12.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.305366039276123, -3.1898200511932373, -3.0742740631103516, -2.9587278366088867, -2.843181848526001, -2.7276358604431152, -2.6120896339416504, -2.4965436458587646, -2.380997657775879, -2.265451669692993, -2.1499056816101074, -2.0343594551086426, -1.9188134670257568, -1.803267478942871, -1.6877213716506958, -1.5721752643585205, -1.4566292762756348, -1.341083288192749, -1.2255371809005737, -1.1099910736083984, -0.9944450855255127, -0.8788990378379822, -0.7633529901504517, -0.6478069424629211, -0.5322608947753906, -0.4167148470878601, -0.3011687994003296, -0.18562275171279907, -0.07007670402526855, 0.04546934366226196, 0.16101539134979248, 0.276561439037323, 0.3921074867248535, 0.507653534412384, 0.6231995820999146, 0.7387456297874451, 0.8542916774749756, 0.9698377251625061, 1.0853837728500366, 1.200929880142212, 1.3164758682250977, 1.4320218563079834, 1.5475679636001587, 1.663114070892334, 1.7786600589752197, 1.8942060470581055, 2.0097522735595703, 2.125298261642456, 2.240844249725342, 2.3563902378082275, 2.4719362258911133, 2.587482452392578, 2.703028440475464, 2.8185744285583496, 2.9341206550598145, 3.0496666431427, 3.165212631225586, 3.2807586193084717, 3.3963046073913574, 3.5118508338928223, 3.627396821975708, 3.7429428100585938, 3.8584890365600586, 3.9740350246429443, 4.08958101272583]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 7.0, 12.0, 16.0, 14.0, 25.0, 30.0, 30.0, 39.0, 47.0, 54.0, 60.0, 56.0, 43.0, 55.0, 58.0, 57.0, 55.0, 44.0, 50.0, 45.0, 27.0, 22.0, 26.0, 28.0, 12.0, 26.0, 14.0, 8.0, 6.0, 9.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.258880853652954, -3.158141613006592, -3.0574026107788086, -2.9566633701324463, -2.855924129486084, -2.7551848888397217, -2.6544456481933594, -2.553706645965576, -2.452967405319214, -2.3522281646728516, -2.2514891624450684, -2.150749921798706, -2.0500106811523438, -1.9492714405059814, -1.8485323190689087, -1.747793197631836, -1.6470539569854736, -1.5463147163391113, -1.4455755949020386, -1.3448364734649658, -1.2440972328186035, -1.1433579921722412, -1.0426188707351685, -0.9418796896934509, -0.8411405086517334, -0.7404013276100159, -0.6396621465682983, -0.5389229655265808, -0.4381837844848633, -0.33744460344314575, -0.23670542240142822, -0.1359662413597107, -0.035227298736572266, 0.06551188230514526, 0.1662510633468628, 0.2669902443885803, 0.36772942543029785, 0.4684686064720154, 0.5692077875137329, 0.6699469685554504, 0.770686149597168, 0.8714253306388855, 0.972164511680603, 1.0729036331176758, 1.173642873764038, 1.2743821144104004, 1.3751212358474731, 1.475860357284546, 1.5765995979309082, 1.6773388385772705, 1.7780779600143433, 1.878817081451416, 1.9795563220977783, 2.0802955627441406, 2.181034564971924, 2.281773805618286, 2.3825130462646484, 2.4832522869110107, 2.583991527557373, 2.6847305297851562, 2.7854697704315186, 2.886209011077881, 2.986948013305664, 3.0876872539520264, 3.1884264945983887]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 11.0, 14.0, 14.0, 26.0, 33.0, 66.0, 107.0, 222.0, 480.0, 1019.0, 3211.0, 21715.0, 3811132.0, 341215.0, 11001.0, 2279.0, 899.0, 368.0, 160.0, 116.0, 58.0, 42.0, 29.0, 12.0, 9.0, 7.0, 8.0, 9.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.40234375, -1.36322021484375, -1.3240966796875, -1.28497314453125, -1.245849609375, -1.20672607421875, -1.1676025390625, -1.12847900390625, -1.08935546875, -1.05023193359375, -1.0111083984375, -0.97198486328125, -0.932861328125, -0.89373779296875, -0.8546142578125, -0.81549072265625, -0.7763671875, -0.73724365234375, -0.6981201171875, -0.65899658203125, -0.619873046875, -0.58074951171875, -0.5416259765625, -0.50250244140625, -0.46337890625, -0.42425537109375, -0.3851318359375, -0.34600830078125, -0.306884765625, -0.26776123046875, -0.2286376953125, -0.18951416015625, -0.150390625, -0.11126708984375, -0.0721435546875, -0.03302001953125, 0.006103515625, 0.04522705078125, 0.0843505859375, 0.12347412109375, 0.16259765625, 0.20172119140625, 0.2408447265625, 0.27996826171875, 0.319091796875, 0.35821533203125, 0.3973388671875, 0.43646240234375, 0.4755859375, 0.51470947265625, 0.5538330078125, 0.59295654296875, 0.632080078125, 0.67120361328125, 0.7103271484375, 0.74945068359375, 0.78857421875, 0.82769775390625, 0.8668212890625, 0.90594482421875, 0.945068359375, 0.98419189453125, 1.0233154296875, 1.06243896484375, 1.1015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 8.0, 17.0, 28.0, 47.0, 65.0, 109.0, 101.0, 154.0, 127.0, 113.0, 76.0, 62.0, 41.0, 18.0, 12.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.188720703125, -0.18314170837402344, -0.17756271362304688, -0.1719837188720703, -0.16640472412109375, -0.1608257293701172, -0.15524673461914062, -0.14966773986816406, -0.1440887451171875, -0.13850975036621094, -0.13293075561523438, -0.1273517608642578, -0.12177276611328125, -0.11619377136230469, -0.11061477661132812, -0.10503578186035156, -0.099456787109375, -0.09387779235839844, -0.08829879760742188, -0.08271980285644531, -0.07714080810546875, -0.07156181335449219, -0.06598281860351562, -0.06040382385253906, -0.0548248291015625, -0.04924583435058594, -0.043666839599609375, -0.03808784484863281, -0.03250885009765625, -0.026929855346679688, -0.021350860595703125, -0.015771865844726562, -0.01019287109375, -0.0046138763427734375, 0.000965118408203125, 0.0065441131591796875, 0.01212310791015625, 0.017702102661132812, 0.023281097412109375, 0.028860092163085938, 0.0344390869140625, 0.04001808166503906, 0.045597076416015625, 0.05117607116699219, 0.05675506591796875, 0.06233406066894531, 0.06791305541992188, 0.07349205017089844, 0.079071044921875, 0.08465003967285156, 0.09022903442382812, 0.09580802917480469, 0.10138702392578125, 0.10696601867675781, 0.11254501342773438, 0.11812400817871094, 0.1237030029296875, 0.12928199768066406, 0.13486099243164062, 0.1404399871826172, 0.14601898193359375, 0.1515979766845703, 0.15717697143554688, 0.16275596618652344, 0.1683349609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 14.0, 14.0, 12.0, 17.0, 34.0, 43.0, 69.0, 91.0, 136.0, 170.0, 237.0, 369.0, 589.0, 1139.0, 2978.0, 11275.0, 72019.0, 3144496.0, 905804.0, 41560.0, 8189.0, 2557.0, 1084.0, 542.0, 302.0, 162.0, 126.0, 81.0, 53.0, 36.0, 22.0, 18.0, 9.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5231285095214844, -0.5076828002929688, -0.4922370910644531, -0.4767913818359375, -0.4613456726074219, -0.44589996337890625, -0.4304542541503906, -0.415008544921875, -0.3995628356933594, -0.38411712646484375, -0.3686714172363281, -0.3532257080078125, -0.3377799987792969, -0.32233428955078125, -0.3068885803222656, -0.29144287109375, -0.2759971618652344, -0.26055145263671875, -0.24510574340820312, -0.2296600341796875, -0.21421432495117188, -0.19876861572265625, -0.18332290649414062, -0.167877197265625, -0.15243148803710938, -0.13698577880859375, -0.12154006958007812, -0.1060943603515625, -0.09064865112304688, -0.07520294189453125, -0.059757232666015625, -0.0443115234375, -0.028865814208984375, -0.01342010498046875, 0.002025604248046875, 0.0174713134765625, 0.032917022705078125, 0.04836273193359375, 0.06380844116210938, 0.079254150390625, 0.09469985961914062, 0.11014556884765625, 0.12559127807617188, 0.1410369873046875, 0.15648269653320312, 0.17192840576171875, 0.18737411499023438, 0.20281982421875, 0.21826553344726562, 0.23371124267578125, 0.24915695190429688, 0.2646026611328125, 0.2800483703613281, 0.29549407958984375, 0.3109397888183594, 0.326385498046875, 0.3418312072753906, 0.35727691650390625, 0.3727226257324219, 0.3881683349609375, 0.4036140441894531, 0.41905975341796875, 0.4345054626464844, 0.449951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 16.0, 21.0, 29.0, 48.0, 116.0, 303.0, 1155.0, 1700.0, 363.0, 157.0, 69.0, 41.0, 13.0, 14.0, 12.0, 6.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.2552661895751953, -0.24856948852539062, -0.24187278747558594, -0.23517608642578125, -0.22847938537597656, -0.22178268432617188, -0.2150859832763672, -0.2083892822265625, -0.2016925811767578, -0.19499588012695312, -0.18829917907714844, -0.18160247802734375, -0.17490577697753906, -0.16820907592773438, -0.1615123748779297, -0.154815673828125, -0.1481189727783203, -0.14142227172851562, -0.13472557067871094, -0.12802886962890625, -0.12133216857910156, -0.11463546752929688, -0.10793876647949219, -0.1012420654296875, -0.09454536437988281, -0.08784866333007812, -0.08115196228027344, -0.07445526123046875, -0.06775856018066406, -0.061061859130859375, -0.05436515808105469, -0.04766845703125, -0.04097175598144531, -0.034275054931640625, -0.027578353881835938, -0.02088165283203125, -0.014184951782226562, -0.007488250732421875, -0.0007915496826171875, 0.0059051513671875, 0.012601852416992188, 0.019298553466796875, 0.025995254516601562, 0.03269195556640625, 0.03938865661621094, 0.046085357666015625, 0.05278205871582031, 0.059478759765625, 0.06617546081542969, 0.07287216186523438, 0.07956886291503906, 0.08626556396484375, 0.09296226501464844, 0.09965896606445312, 0.10635566711425781, 0.1130523681640625, 0.11974906921386719, 0.12644577026367188, 0.13314247131347656, 0.13983917236328125, 0.14653587341308594, 0.15323257446289062, 0.1599292755126953, 0.1666259765625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 21.0, 79.0, 247.0, 395.0, 177.0, 56.0, 14.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2514867782592773, -1.2057465314865112, -1.1600062847137451, -1.114266037940979, -1.068525791168213, -1.0227855443954468, -0.9770452976226807, -0.9313050508499146, -0.8855648040771484, -0.8398245573043823, -0.7940843105316162, -0.7483440637588501, -0.702603816986084, -0.6568635702133179, -0.6111233234405518, -0.5653830766677856, -0.5196428894996643, -0.4739026427268982, -0.4281623959541321, -0.38242214918136597, -0.33668190240859985, -0.29094165563583374, -0.24520143866539001, -0.1994611918926239, -0.1537209451198578, -0.10798069834709167, -0.06224045902490616, -0.016500219702720642, 0.02924002707004547, 0.07498027384281158, 0.1207205057144165, 0.16646075248718262, 0.21220099925994873, 0.25794124603271484, 0.30368149280548096, 0.34942173957824707, 0.3951619863510132, 0.4409022331237793, 0.486642450094223, 0.5323827266693115, 0.5781229734420776, 0.6238632202148438, 0.6696034669876099, 0.715343713760376, 0.7610839605331421, 0.8068242073059082, 0.8525644540786743, 0.8983047008514404, 0.9440448880195618, 0.9897851347923279, 1.0355253219604492, 1.0812655687332153, 1.1270058155059814, 1.1727460622787476, 1.2184863090515137, 1.2642265558242798, 1.309966802597046, 1.355707049369812, 1.4014472961425781, 1.4471875429153442, 1.4929277896881104, 1.5386680364608765, 1.5844082832336426, 1.6301485300064087, 1.6758887767791748]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 0.0, 4.0, 8.0, 11.0, 16.0, 16.0, 12.0, 30.0, 23.0, 27.0, 38.0, 47.0, 58.0, 41.0, 50.0, 54.0, 64.0, 55.0, 46.0, 62.0, 42.0, 43.0, 54.0, 35.0, 30.0, 40.0, 20.0, 19.0, 15.0, 8.0, 11.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5758954286575317, -0.5598230361938477, -0.5437506437301636, -0.5276781916618347, -0.5116057991981506, -0.49553340673446655, -0.47946101427078247, -0.463388592004776, -0.44731616973876953, -0.43124377727508545, -0.415171355009079, -0.3990989625453949, -0.3830265402793884, -0.36695414781570435, -0.35088175535202026, -0.3348093330860138, -0.3187369406223297, -0.30266454815864563, -0.28659212589263916, -0.2705197334289551, -0.2544473111629486, -0.23837491869926453, -0.22230251133441925, -0.20623010396957397, -0.1901576966047287, -0.17408528923988342, -0.15801288187503815, -0.14194047451019287, -0.1258680820465088, -0.10979566723108292, -0.09372326731681824, -0.07765085995197296, -0.061578452587127686, -0.04550604522228241, -0.029433641582727432, -0.013361237943172455, 0.002711169421672821, 0.018783576786518097, 0.034855976700782776, 0.05092838406562805, 0.06700079143047333, 0.0830731987953186, 0.09914560616016388, 0.11521800607442856, 0.13129040598869324, 0.1473628282546997, 0.1634352207183838, 0.17950762808322906, 0.19558003544807434, 0.21165244281291962, 0.2277248501777649, 0.24379724264144897, 0.25986966490745544, 0.2759420573711395, 0.292014479637146, 0.3080868721008301, 0.32415926456451416, 0.34023165702819824, 0.3563040792942047, 0.3723764717578888, 0.38844889402389526, 0.40452128648757935, 0.4205936789512634, 0.4366661012172699, 0.45273852348327637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 6.0, 13.0, 20.0, 19.0, 20.0, 28.0, 51.0, 67.0, 95.0, 114.0, 153.0, 193.0, 322.0, 489.0, 793.0, 1481.0, 3037.0, 7577.0, 23799.0, 98823.0, 461130.0, 350606.0, 69722.0, 17996.0, 6124.0, 2516.0, 1207.0, 714.0, 418.0, 252.0, 189.0, 169.0, 90.0, 75.0, 52.0, 49.0, 36.0, 17.0, 24.0, 15.0, 11.0, 7.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.35791015625, -0.3470268249511719, -0.33614349365234375, -0.3252601623535156, -0.3143768310546875, -0.3034934997558594, -0.29261016845703125, -0.2817268371582031, -0.270843505859375, -0.2599601745605469, -0.24907684326171875, -0.23819351196289062, -0.2273101806640625, -0.21642684936523438, -0.20554351806640625, -0.19466018676757812, -0.18377685546875, -0.17289352416992188, -0.16201019287109375, -0.15112686157226562, -0.1402435302734375, -0.12936019897460938, -0.11847686767578125, -0.10759353637695312, -0.096710205078125, -0.08582687377929688, -0.07494354248046875, -0.06406021118164062, -0.0531768798828125, -0.042293548583984375, -0.03141021728515625, -0.020526885986328125, -0.0096435546875, 0.001239776611328125, 0.01212310791015625, 0.023006439208984375, 0.0338897705078125, 0.044773101806640625, 0.05565643310546875, 0.06653976440429688, 0.077423095703125, 0.08830642700195312, 0.09918975830078125, 0.11007308959960938, 0.1209564208984375, 0.13183975219726562, 0.14272308349609375, 0.15360641479492188, 0.16448974609375, 0.17537307739257812, 0.18625640869140625, 0.19713973999023438, 0.2080230712890625, 0.21890640258789062, 0.22978973388671875, 0.24067306518554688, 0.251556396484375, 0.2624397277832031, 0.27332305908203125, 0.2842063903808594, 0.2950897216796875, 0.3059730529785156, 0.31685638427734375, 0.3277397155761719, 0.338623046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 20.0, 46.0, 50.0, 83.0, 100.0, 124.0, 147.0, 142.0, 84.0, 74.0, 42.0, 34.0, 17.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1677532196044922, -0.16241073608398438, -0.15706825256347656, -0.15172576904296875, -0.14638328552246094, -0.14104080200195312, -0.1356983184814453, -0.1303558349609375, -0.1250133514404297, -0.11967086791992188, -0.11432838439941406, -0.10898590087890625, -0.10364341735839844, -0.09830093383789062, -0.09295845031738281, -0.087615966796875, -0.08227348327636719, -0.07693099975585938, -0.07158851623535156, -0.06624603271484375, -0.06090354919433594, -0.055561065673828125, -0.05021858215332031, -0.0448760986328125, -0.03953361511230469, -0.034191131591796875, -0.028848648071289062, -0.02350616455078125, -0.018163681030273438, -0.012821197509765625, -0.0074787139892578125, -0.00213623046875, 0.0032062530517578125, 0.008548736572265625, 0.013891220092773438, 0.01923370361328125, 0.024576187133789062, 0.029918670654296875, 0.03526115417480469, 0.0406036376953125, 0.04594612121582031, 0.051288604736328125, 0.05663108825683594, 0.06197357177734375, 0.06731605529785156, 0.07265853881835938, 0.07800102233886719, 0.083343505859375, 0.08868598937988281, 0.09402847290039062, 0.09937095642089844, 0.10471343994140625, 0.11005592346191406, 0.11539840698242188, 0.12074089050292969, 0.1260833740234375, 0.1314258575439453, 0.13676834106445312, 0.14211082458496094, 0.14745330810546875, 0.15279579162597656, 0.15813827514648438, 0.1634807586669922, 0.1688232421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 11.0, 4.0, 6.0, 11.0, 12.0, 25.0, 21.0, 22.0, 43.0, 69.0, 77.0, 116.0, 168.0, 301.0, 467.0, 765.0, 1539.0, 3051.0, 6495.0, 15869.0, 44665.0, 154091.0, 424163.0, 275506.0, 76902.0, 25078.0, 9844.0, 4358.0, 2068.0, 1113.0, 615.0, 338.0, 210.0, 152.0, 104.0, 68.0, 52.0, 39.0, 34.0, 22.0, 14.0, 12.0, 11.0, 8.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2890625, -0.2799530029296875, -0.270843505859375, -0.2617340087890625, -0.25262451171875, -0.2435150146484375, -0.234405517578125, -0.2252960205078125, -0.2161865234375, -0.2070770263671875, -0.197967529296875, -0.1888580322265625, -0.17974853515625, -0.1706390380859375, -0.161529541015625, -0.1524200439453125, -0.143310546875, -0.1342010498046875, -0.125091552734375, -0.1159820556640625, -0.10687255859375, -0.0977630615234375, -0.088653564453125, -0.0795440673828125, -0.0704345703125, -0.0613250732421875, -0.052215576171875, -0.0431060791015625, -0.03399658203125, -0.0248870849609375, -0.015777587890625, -0.0066680908203125, 0.00244140625, 0.0115509033203125, 0.020660400390625, 0.0297698974609375, 0.03887939453125, 0.0479888916015625, 0.057098388671875, 0.0662078857421875, 0.0753173828125, 0.0844268798828125, 0.093536376953125, 0.1026458740234375, 0.11175537109375, 0.1208648681640625, 0.129974365234375, 0.1390838623046875, 0.148193359375, 0.1573028564453125, 0.166412353515625, 0.1755218505859375, 0.18463134765625, 0.1937408447265625, 0.202850341796875, 0.2119598388671875, 0.2210693359375, 0.2301788330078125, 0.239288330078125, 0.2483978271484375, 0.25750732421875, 0.2666168212890625, 0.275726318359375, 0.2848358154296875, 0.2939453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 5.0, 5.0, 5.0, 4.0, 8.0, 17.0, 16.0, 16.0, 18.0, 25.0, 18.0, 34.0, 43.0, 36.0, 58.0, 35.0, 45.0, 36.0, 38.0, 50.0, 49.0, 38.0, 42.0, 46.0, 44.0, 29.0, 34.0, 37.0, 18.0, 24.0, 25.0, 13.0, 9.0, 8.0, 11.0, 12.0, 14.0, 5.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.40283203125, -0.3906669616699219, -0.37850189208984375, -0.3663368225097656, -0.3541717529296875, -0.3420066833496094, -0.32984161376953125, -0.3176765441894531, -0.305511474609375, -0.2933464050292969, -0.28118133544921875, -0.2690162658691406, -0.2568511962890625, -0.24468612670898438, -0.23252105712890625, -0.22035598754882812, -0.20819091796875, -0.19602584838867188, -0.18386077880859375, -0.17169570922851562, -0.1595306396484375, -0.14736557006835938, -0.13520050048828125, -0.12303543090820312, -0.110870361328125, -0.09870529174804688, -0.08654022216796875, -0.07437515258789062, -0.0622100830078125, -0.050045013427734375, -0.03787994384765625, -0.025714874267578125, -0.0135498046875, -0.001384735107421875, 0.01078033447265625, 0.022945404052734375, 0.0351104736328125, 0.047275543212890625, 0.05944061279296875, 0.07160568237304688, 0.083770751953125, 0.09593582153320312, 0.10810089111328125, 0.12026596069335938, 0.1324310302734375, 0.14459609985351562, 0.15676116943359375, 0.16892623901367188, 0.18109130859375, 0.19325637817382812, 0.20542144775390625, 0.21758651733398438, 0.2297515869140625, 0.24191665649414062, 0.25408172607421875, 0.2662467956542969, 0.278411865234375, 0.2905769348144531, 0.30274200439453125, 0.3149070739746094, 0.3270721435546875, 0.3392372131347656, 0.35140228271484375, 0.3635673522949219, 0.375732421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 11.0, 8.0, 11.0, 11.0, 8.0, 35.0, 38.0, 64.0, 83.0, 167.0, 289.0, 532.0, 1110.0, 2822.0, 8695.0, 33783.0, 158749.0, 534955.0, 238954.0, 49260.0, 12356.0, 3721.0, 1464.0, 599.0, 327.0, 185.0, 113.0, 52.0, 42.0, 28.0, 16.0, 14.0, 7.0, 8.0, 6.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.11907958984375, -0.1158285140991211, -0.11257743835449219, -0.10932636260986328, -0.10607528686523438, -0.10282421112060547, -0.09957313537597656, -0.09632205963134766, -0.09307098388671875, -0.08981990814208984, -0.08656883239746094, -0.08331775665283203, -0.08006668090820312, -0.07681560516357422, -0.07356452941894531, -0.0703134536743164, -0.0670623779296875, -0.0638113021850586, -0.06056022644042969, -0.05730915069580078, -0.054058074951171875, -0.05080699920654297, -0.04755592346191406, -0.044304847717285156, -0.04105377197265625, -0.037802696228027344, -0.03455162048339844, -0.03130054473876953, -0.028049468994140625, -0.02479839324951172, -0.021547317504882812, -0.018296241760253906, -0.015045166015625, -0.011794090270996094, -0.008543014526367188, -0.005291938781738281, -0.002040863037109375, 0.0012102127075195312, 0.0044612884521484375, 0.007712364196777344, 0.01096343994140625, 0.014214515686035156, 0.017465591430664062, 0.02071666717529297, 0.023967742919921875, 0.02721881866455078, 0.030469894409179688, 0.033720970153808594, 0.0369720458984375, 0.040223121643066406, 0.04347419738769531, 0.04672527313232422, 0.049976348876953125, 0.05322742462158203, 0.05647850036621094, 0.059729576110839844, 0.06298065185546875, 0.06623172760009766, 0.06948280334472656, 0.07273387908935547, 0.07598495483398438, 0.07923603057861328, 0.08248710632324219, 0.0857381820678711, 0.0889892578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 12.0, 11.0, 21.0, 26.0, 35.0, 37.0, 52.0, 96.0, 134.0, 142.0, 126.0, 88.0, 59.0, 45.0, 33.0, 24.0, 18.0, 11.0, 11.0, 6.0, 0.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020694732666015625, -0.00020219851285219193, -0.0001974496990442276, -0.00019270088523626328, -0.00018795207142829895, -0.00018320325762033463, -0.0001784544438123703, -0.00017370563000440598, -0.00016895681619644165, -0.00016420800238847733, -0.000159459188580513, -0.00015471037477254868, -0.00014996156096458435, -0.00014521274715662003, -0.0001404639333486557, -0.00013571511954069138, -0.00013096630573272705, -0.00012621749192476273, -0.0001214686781167984, -0.00011671986430883408, -0.00011197105050086975, -0.00010722223669290543, -0.0001024734228849411, -9.772460907697678e-05, -9.297579526901245e-05, -8.822698146104813e-05, -8.34781676530838e-05, -7.872935384511948e-05, -7.398054003715515e-05, -6.923172622919083e-05, -6.44829124212265e-05, -5.9734098613262177e-05, -5.498528480529785e-05, -5.0236470997333527e-05, -4.54876571893692e-05, -4.073884338140488e-05, -3.599002957344055e-05, -3.124121576547623e-05, -2.6492401957511902e-05, -2.1743588149547577e-05, -1.6994774341583252e-05, -1.2245960533618927e-05, -7.497146725654602e-06, -2.748332917690277e-06, 2.000480890274048e-06, 6.749294698238373e-06, 1.1498108506202698e-05, 1.6246922314167023e-05, 2.0995736122131348e-05, 2.5744549930095673e-05, 3.0493363738059998e-05, 3.524217754602432e-05, 3.999099135398865e-05, 4.473980516195297e-05, 4.94886189699173e-05, 5.423743277788162e-05, 5.898624658584595e-05, 6.373506039381027e-05, 6.84838742017746e-05, 7.323268800973892e-05, 7.798150181770325e-05, 8.273031562566757e-05, 8.74791294336319e-05, 9.222794324159622e-05, 9.697675704956055e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 13.0, 14.0, 23.0, 46.0, 51.0, 92.0, 148.0, 213.0, 414.0, 769.0, 1629.0, 4070.0, 12952.0, 53072.0, 251757.0, 530099.0, 146607.0, 32512.0, 8529.0, 2849.0, 1258.0, 591.0, 325.0, 166.0, 122.0, 57.0, 41.0, 31.0, 17.0, 21.0, 17.0, 10.0, 7.0, 6.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11688232421875, -0.11347770690917969, -0.11007308959960938, -0.10666847229003906, -0.10326385498046875, -0.09985923767089844, -0.09645462036132812, -0.09305000305175781, -0.0896453857421875, -0.08624076843261719, -0.08283615112304688, -0.07943153381347656, -0.07602691650390625, -0.07262229919433594, -0.06921768188476562, -0.06581306457519531, -0.062408447265625, -0.05900382995605469, -0.055599212646484375, -0.05219459533691406, -0.04878997802734375, -0.04538536071777344, -0.041980743408203125, -0.03857612609863281, -0.0351715087890625, -0.03176689147949219, -0.028362274169921875, -0.024957656860351562, -0.02155303955078125, -0.018148422241210938, -0.014743804931640625, -0.011339187622070312, -0.0079345703125, -0.0045299530029296875, -0.001125335693359375, 0.0022792816162109375, 0.00568389892578125, 0.009088516235351562, 0.012493133544921875, 0.015897750854492188, 0.0193023681640625, 0.022706985473632812, 0.026111602783203125, 0.029516220092773438, 0.03292083740234375, 0.03632545471191406, 0.039730072021484375, 0.04313468933105469, 0.046539306640625, 0.04994392395019531, 0.053348541259765625, 0.05675315856933594, 0.06015777587890625, 0.06356239318847656, 0.06696701049804688, 0.07037162780761719, 0.0737762451171875, 0.07718086242675781, 0.08058547973632812, 0.08399009704589844, 0.08739471435546875, 0.09079933166503906, 0.09420394897460938, 0.09760856628417969, 0.10101318359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 17.0, 18.0, 28.0, 41.0, 67.0, 85.0, 105.0, 106.0, 110.0, 108.0, 97.0, 55.0, 53.0, 33.0, 30.0, 13.0, 9.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14612293243408203, -0.14197731018066406, -0.1378316879272461, -0.13368606567382812, -0.12954044342041016, -0.1253948211669922, -0.12124919891357422, -0.11710357666015625, -0.11295795440673828, -0.10881233215332031, -0.10466670989990234, -0.10052108764648438, -0.0963754653930664, -0.09222984313964844, -0.08808422088623047, -0.0839385986328125, -0.07979297637939453, -0.07564735412597656, -0.0715017318725586, -0.06735610961914062, -0.06321048736572266, -0.05906486511230469, -0.05491924285888672, -0.05077362060546875, -0.04662799835205078, -0.04248237609863281, -0.038336753845214844, -0.034191131591796875, -0.030045509338378906, -0.025899887084960938, -0.02175426483154297, -0.017608642578125, -0.013463020324707031, -0.009317398071289062, -0.005171775817871094, -0.001026153564453125, 0.0031194686889648438, 0.0072650909423828125, 0.011410713195800781, 0.01555633544921875, 0.01970195770263672, 0.023847579956054688, 0.027993202209472656, 0.032138824462890625, 0.036284446716308594, 0.04043006896972656, 0.04457569122314453, 0.0487213134765625, 0.05286693572998047, 0.05701255798339844, 0.061158180236816406, 0.06530380249023438, 0.06944942474365234, 0.07359504699707031, 0.07774066925048828, 0.08188629150390625, 0.08603191375732422, 0.09017753601074219, 0.09432315826416016, 0.09846878051757812, 0.1026144027709961, 0.10676002502441406, 0.11090564727783203, 0.11505126953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 19.0, 9.0, 13.0, 39.0, 54.0, 122.0, 204.0, 226.0, 118.0, 79.0, 37.0, 23.0, 21.0, 16.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.877943515777588, -1.7968614101409912, -1.715779423713684, -1.6346973180770874, -1.5536153316497803, -1.4725332260131836, -1.391451120376587, -1.3103690147399902, -1.229287028312683, -1.1482049226760864, -1.0671229362487793, -0.9860408306121826, -0.9049587845802307, -0.8238767385482788, -0.7427946329116821, -0.6617125868797302, -0.5806305408477783, -0.4995484948158264, -0.4184664189815521, -0.33738434314727783, -0.2563022971153259, -0.17522025108337402, -0.09413817524909973, -0.01305609941482544, 0.06802594661712646, 0.14910800755023956, 0.23019006848335266, 0.31127214431762695, 0.39235419034957886, 0.47343623638153076, 0.5545183420181274, 0.6356003880500793, 0.7166826725006104, 0.7977647185325623, 0.8788467645645142, 0.9599288702011108, 1.041010856628418, 1.1220929622650146, 1.2031750679016113, 1.284257173538208, 1.3653391599655151, 1.4464212656021118, 1.527503252029419, 1.6085853576660156, 1.6896674633026123, 1.7707494497299194, 1.8518315553665161, 1.9329135417938232, 2.01399564743042, 2.0950777530670166, 2.1761598587036133, 2.257241725921631, 2.3383238315582275, 2.419405937194824, 2.500488042831421, 2.5815701484680176, 2.662652015686035, 2.743734121322632, 2.8248162269592285, 2.905898094177246, 2.9869801998138428, 3.0680623054504395, 3.149144411087036, 3.230226516723633, 3.3113086223602295]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 9.0, 12.0, 10.0, 9.0, 16.0, 25.0, 21.0, 33.0, 26.0, 32.0, 36.0, 40.0, 47.0, 35.0, 43.0, 50.0, 41.0, 47.0, 47.0, 51.0, 42.0, 38.0, 36.0, 28.0, 27.0, 30.0, 20.0, 16.0, 17.0, 9.0, 12.0, 10.0, 7.0, 9.0, 8.0, 6.0, 8.0, 2.0, 3.0, 2.0, 1.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.3410449028015137, -2.270845651626587, -2.20064640045166, -2.1304471492767334, -2.0602478981018066, -1.9900486469268799, -1.9198493957519531, -1.8496501445770264, -1.7794508934020996, -1.7092516422271729, -1.639052391052246, -1.5688531398773193, -1.4986538887023926, -1.4284546375274658, -1.358255386352539, -1.2880561351776123, -1.2178568840026855, -1.1476576328277588, -1.077458381652832, -1.0072591304779053, -0.9370598793029785, -0.8668606281280518, -0.796661376953125, -0.7264621257781982, -0.6562628746032715, -0.5860636234283447, -0.515864372253418, -0.4456651210784912, -0.37546586990356445, -0.3052666187286377, -0.23506736755371094, -0.16486811637878418, -0.09466910362243652, -0.024469852447509766, 0.04572939872741699, 0.11592864990234375, 0.1861279010772705, 0.25632715225219727, 0.326526403427124, 0.3967256546020508, 0.46692490577697754, 0.5371241569519043, 0.607323408126831, 0.6775226593017578, 0.7477219104766846, 0.8179211616516113, 0.8881204128265381, 0.9583196640014648, 1.0285189151763916, 1.0987181663513184, 1.1689174175262451, 1.2391166687011719, 1.3093159198760986, 1.3795151710510254, 1.4497144222259521, 1.519913673400879, 1.5901129245758057, 1.6603121757507324, 1.7305114269256592, 1.800710678100586, 1.8709099292755127, 1.9411091804504395, 2.011308431625366, 2.081507682800293, 2.1517069339752197]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 11.0, 13.0, 20.0, 19.0, 43.0, 81.0, 131.0, 253.0, 515.0, 1164.0, 3306.0, 11711.0, 103406.0, 3962158.0, 94279.0, 11448.0, 3072.0, 1296.0, 563.0, 276.0, 176.0, 96.0, 60.0, 56.0, 33.0, 23.0, 17.0, 13.0, 10.0, 5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5022354125976562, -0.4839630126953125, -0.46569061279296875, -0.447418212890625, -0.42914581298828125, -0.4108734130859375, -0.39260101318359375, -0.37432861328125, -0.35605621337890625, -0.3377838134765625, -0.31951141357421875, -0.301239013671875, -0.28296661376953125, -0.2646942138671875, -0.24642181396484375, -0.2281494140625, -0.20987701416015625, -0.1916046142578125, -0.17333221435546875, -0.155059814453125, -0.13678741455078125, -0.1185150146484375, -0.10024261474609375, -0.08197021484375, -0.06369781494140625, -0.0454254150390625, -0.02715301513671875, -0.008880615234375, 0.00939178466796875, 0.0276641845703125, 0.04593658447265625, 0.064208984375, 0.08248138427734375, 0.1007537841796875, 0.11902618408203125, 0.137298583984375, 0.15557098388671875, 0.1738433837890625, 0.19211578369140625, 0.21038818359375, 0.22866058349609375, 0.2469329833984375, 0.26520538330078125, 0.283477783203125, 0.30175018310546875, 0.3200225830078125, 0.33829498291015625, 0.3565673828125, 0.37483978271484375, 0.3931121826171875, 0.41138458251953125, 0.429656982421875, 0.44792938232421875, 0.4662017822265625, 0.48447418212890625, 0.50274658203125, 0.5210189819335938, 0.5392913818359375, 0.5575637817382812, 0.575836181640625, 0.5941085815429688, 0.6123809814453125, 0.6306533813476562, 0.64892578125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 15.0, 24.0, 39.0, 40.0, 71.0, 95.0, 99.0, 102.0, 134.0, 98.0, 82.0, 62.0, 39.0, 34.0, 17.0, 13.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1492919921875, -0.14429283142089844, -0.13929367065429688, -0.1342945098876953, -0.12929534912109375, -0.12429618835449219, -0.11929702758789062, -0.11429786682128906, -0.1092987060546875, -0.10429954528808594, -0.09930038452148438, -0.09430122375488281, -0.08930206298828125, -0.08430290222167969, -0.07930374145507812, -0.07430458068847656, -0.069305419921875, -0.06430625915527344, -0.059307098388671875, -0.05430793762207031, -0.04930877685546875, -0.04430961608886719, -0.039310455322265625, -0.03431129455566406, -0.0293121337890625, -0.024312973022460938, -0.019313812255859375, -0.014314651489257812, -0.00931549072265625, -0.0043163299560546875, 0.000682830810546875, 0.0056819915771484375, 0.01068115234375, 0.015680313110351562, 0.020679473876953125, 0.025678634643554688, 0.03067779541015625, 0.03567695617675781, 0.040676116943359375, 0.04567527770996094, 0.0506744384765625, 0.05567359924316406, 0.060672760009765625, 0.06567192077636719, 0.07067108154296875, 0.07567024230957031, 0.08066940307617188, 0.08566856384277344, 0.090667724609375, 0.09566688537597656, 0.10066604614257812, 0.10566520690917969, 0.11066436767578125, 0.11566352844238281, 0.12066268920898438, 0.12566184997558594, 0.1306610107421875, 0.13566017150878906, 0.14065933227539062, 0.1456584930419922, 0.15065765380859375, 0.1556568145751953, 0.16065597534179688, 0.16565513610839844, 0.170654296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 14.0, 10.0, 22.0, 30.0, 42.0, 65.0, 105.0, 166.0, 297.0, 538.0, 969.0, 2116.0, 5619.0, 20177.0, 130557.0, 3324234.0, 641029.0, 49631.0, 11169.0, 3903.0, 1625.0, 809.0, 456.0, 258.0, 164.0, 98.0, 66.0, 42.0, 24.0, 15.0, 11.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28466796875, -0.27597808837890625, -0.2672882080078125, -0.25859832763671875, -0.249908447265625, -0.24121856689453125, -0.2325286865234375, -0.22383880615234375, -0.21514892578125, -0.20645904541015625, -0.1977691650390625, -0.18907928466796875, -0.180389404296875, -0.17169952392578125, -0.1630096435546875, -0.15431976318359375, -0.1456298828125, -0.13694000244140625, -0.1282501220703125, -0.11956024169921875, -0.110870361328125, -0.10218048095703125, -0.0934906005859375, -0.08480072021484375, -0.07611083984375, -0.06742095947265625, -0.0587310791015625, -0.05004119873046875, -0.041351318359375, -0.03266143798828125, -0.0239715576171875, -0.01528167724609375, -0.006591796875, 0.00209808349609375, 0.0107879638671875, 0.01947784423828125, 0.028167724609375, 0.03685760498046875, 0.0455474853515625, 0.05423736572265625, 0.06292724609375, 0.07161712646484375, 0.0803070068359375, 0.08899688720703125, 0.097686767578125, 0.10637664794921875, 0.1150665283203125, 0.12375640869140625, 0.1324462890625, 0.14113616943359375, 0.1498260498046875, 0.15851593017578125, 0.167205810546875, 0.17589569091796875, 0.1845855712890625, 0.19327545166015625, 0.20196533203125, 0.21065521240234375, 0.2193450927734375, 0.22803497314453125, 0.236724853515625, 0.24541473388671875, 0.2541046142578125, 0.26279449462890625, 0.271484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 15.0, 5.0, 15.0, 30.0, 31.0, 74.0, 124.0, 297.0, 848.0, 1569.0, 546.0, 216.0, 108.0, 63.0, 34.0, 24.0, 16.0, 12.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09725093841552734, -0.09403800964355469, -0.09082508087158203, -0.08761215209960938, -0.08439922332763672, -0.08118629455566406, -0.0779733657836914, -0.07476043701171875, -0.0715475082397461, -0.06833457946777344, -0.06512165069580078, -0.061908721923828125, -0.05869579315185547, -0.05548286437988281, -0.052269935607910156, -0.0490570068359375, -0.045844078063964844, -0.04263114929199219, -0.03941822052001953, -0.036205291748046875, -0.03299236297607422, -0.029779434204101562, -0.026566505432128906, -0.02335357666015625, -0.020140647888183594, -0.016927719116210938, -0.013714790344238281, -0.010501861572265625, -0.007288932800292969, -0.0040760040283203125, -0.0008630752563476562, 0.002349853515625, 0.005562782287597656, 0.008775711059570312, 0.011988639831542969, 0.015201568603515625, 0.01841449737548828, 0.021627426147460938, 0.024840354919433594, 0.02805328369140625, 0.031266212463378906, 0.03447914123535156, 0.03769207000732422, 0.040904998779296875, 0.04411792755126953, 0.04733085632324219, 0.050543785095214844, 0.0537567138671875, 0.056969642639160156, 0.06018257141113281, 0.06339550018310547, 0.06660842895507812, 0.06982135772705078, 0.07303428649902344, 0.0762472152709961, 0.07946014404296875, 0.0826730728149414, 0.08588600158691406, 0.08909893035888672, 0.09231185913085938, 0.09552478790283203, 0.09873771667480469, 0.10195064544677734, 0.10516357421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 6.0, 10.0, 30.0, 60.0, 124.0, 212.0, 223.0, 186.0, 76.0, 45.0, 14.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7238551378250122, -0.7037040591239929, -0.6835530400276184, -0.6634019613265991, -0.6432509422302246, -0.6230998635292053, -0.6029488444328308, -0.5827977657318115, -0.562646746635437, -0.5424956679344177, -0.5223446488380432, -0.5021935701370239, -0.4820425510406494, -0.4618914723396301, -0.4417404234409332, -0.42158937454223633, -0.40143829584121704, -0.38128724694252014, -0.36113619804382324, -0.34098514914512634, -0.32083410024642944, -0.30068302154541016, -0.28053197264671326, -0.26038092374801636, -0.24022987484931946, -0.22007882595062256, -0.19992777705192566, -0.17977671325206757, -0.15962566435337067, -0.13947461545467377, -0.11932355910539627, -0.09917250275611877, -0.0790213942527771, -0.0588703416287899, -0.038719289004802704, -0.018568236380815506, 0.001582816243171692, 0.02173386514186859, 0.04188492149114609, 0.062035977840423584, 0.08218702673912048, 0.10233807563781738, 0.12248913198709488, 0.14264018833637238, 0.16279123723506927, 0.18294228613376617, 0.20309334993362427, 0.22324439883232117, 0.24339544773101807, 0.26354649662971497, 0.28369754552841187, 0.30384859442710876, 0.32399964332580566, 0.34415072202682495, 0.36430177092552185, 0.38445281982421875, 0.40460386872291565, 0.42475491762161255, 0.44490596652030945, 0.46505701541900635, 0.48520809412002563, 0.5053591132164001, 0.5255101919174194, 0.545661211013794, 0.5658122897148132]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 9.0, 5.0, 13.0, 13.0, 14.0, 11.0, 20.0, 30.0, 23.0, 34.0, 30.0, 52.0, 52.0, 39.0, 45.0, 43.0, 43.0, 47.0, 46.0, 36.0, 40.0, 45.0, 49.0, 36.0, 35.0, 25.0, 33.0, 25.0, 18.0, 17.0, 13.0, 15.0, 11.0, 9.0, 3.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24737590551376343, -0.23817496001720428, -0.22897401452064514, -0.219773069024086, -0.21057212352752686, -0.2013711780309677, -0.19217023253440857, -0.18296928703784943, -0.17376834154129028, -0.16456739604473114, -0.155366450548172, -0.14616550505161285, -0.1369645595550537, -0.12776361405849457, -0.11856266856193542, -0.10936172306537628, -0.10016077756881714, -0.090959832072258, -0.08175888657569885, -0.07255794107913971, -0.06335699558258057, -0.05415605008602142, -0.04495510458946228, -0.03575415909290314, -0.026553213596343994, -0.01735226809978485, -0.008151322603225708, 0.001049622893333435, 0.010250568389892578, 0.01945151388645172, 0.028652459383010864, 0.03785340487957001, 0.04705435037612915, 0.05625529587268829, 0.06545624136924744, 0.07465718686580658, 0.08385813236236572, 0.09305907785892487, 0.10226002335548401, 0.11146096885204315, 0.1206619143486023, 0.12986285984516144, 0.13906380534172058, 0.14826475083827972, 0.15746569633483887, 0.166666641831398, 0.17586758732795715, 0.1850685328245163, 0.19426947832107544, 0.20347042381763458, 0.21267136931419373, 0.22187231481075287, 0.231073260307312, 0.24027420580387115, 0.2494751513004303, 0.25867611169815063, 0.2678770422935486, 0.27707797288894653, 0.28627893328666687, 0.2954798936843872, 0.30468082427978516, 0.3138817548751831, 0.32308271527290344, 0.3322836756706238, 0.34148460626602173]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 15.0, 14.0, 33.0, 30.0, 55.0, 62.0, 126.0, 160.0, 278.0, 466.0, 761.0, 1500.0, 3517.0, 9578.0, 33778.0, 177569.0, 593018.0, 176965.0, 34001.0, 9641.0, 3396.0, 1550.0, 765.0, 464.0, 233.0, 183.0, 113.0, 70.0, 58.0, 34.0, 32.0, 19.0, 12.0, 14.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3623046875, -0.35042572021484375, -0.3385467529296875, -0.32666778564453125, -0.314788818359375, -0.30290985107421875, -0.2910308837890625, -0.27915191650390625, -0.26727294921875, -0.25539398193359375, -0.2435150146484375, -0.23163604736328125, -0.219757080078125, -0.20787811279296875, -0.1959991455078125, -0.18412017822265625, -0.1722412109375, -0.16036224365234375, -0.1484832763671875, -0.13660430908203125, -0.124725341796875, -0.11284637451171875, -0.1009674072265625, -0.08908843994140625, -0.07720947265625, -0.06533050537109375, -0.0534515380859375, -0.04157257080078125, -0.029693603515625, -0.01781463623046875, -0.0059356689453125, 0.00594329833984375, 0.017822265625, 0.02970123291015625, 0.0415802001953125, 0.05345916748046875, 0.065338134765625, 0.07721710205078125, 0.0890960693359375, 0.10097503662109375, 0.11285400390625, 0.12473297119140625, 0.1366119384765625, 0.14849090576171875, 0.160369873046875, 0.17224884033203125, 0.1841278076171875, 0.19600677490234375, 0.2078857421875, 0.21976470947265625, 0.2316436767578125, 0.24352264404296875, 0.255401611328125, 0.26728057861328125, 0.2791595458984375, 0.29103851318359375, 0.30291748046875, 0.31479644775390625, 0.3266754150390625, 0.33855438232421875, 0.350433349609375, 0.36231231689453125, 0.3741912841796875, 0.38607025146484375, 0.39794921875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 12.0, 8.0, 9.0, 23.0, 39.0, 36.0, 66.0, 84.0, 114.0, 96.0, 133.0, 101.0, 77.0, 77.0, 46.0, 26.0, 23.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1505126953125, -0.14550209045410156, -0.14049148559570312, -0.1354808807373047, -0.13047027587890625, -0.1254596710205078, -0.12044906616210938, -0.11543846130371094, -0.1104278564453125, -0.10541725158691406, -0.10040664672851562, -0.09539604187011719, -0.09038543701171875, -0.08537483215332031, -0.08036422729492188, -0.07535362243652344, -0.070343017578125, -0.06533241271972656, -0.060321807861328125, -0.05531120300292969, -0.05030059814453125, -0.04528999328613281, -0.040279388427734375, -0.03526878356933594, -0.0302581787109375, -0.025247573852539062, -0.020236968994140625, -0.015226364135742188, -0.01021575927734375, -0.0052051544189453125, -0.000194549560546875, 0.0048160552978515625, 0.00982666015625, 0.014837265014648438, 0.019847869873046875, 0.024858474731445312, 0.02986907958984375, 0.03487968444824219, 0.039890289306640625, 0.04490089416503906, 0.0499114990234375, 0.05492210388183594, 0.059932708740234375, 0.06494331359863281, 0.06995391845703125, 0.07496452331542969, 0.07997512817382812, 0.08498573303222656, 0.089996337890625, 0.09500694274902344, 0.10001754760742188, 0.10502815246582031, 0.11003875732421875, 0.11504936218261719, 0.12005996704101562, 0.12507057189941406, 0.1300811767578125, 0.13509178161621094, 0.14010238647460938, 0.1451129913330078, 0.15012359619140625, 0.1551342010498047, 0.16014480590820312, 0.16515541076660156, 0.170166015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 13.0, 8.0, 12.0, 13.0, 20.0, 30.0, 46.0, 43.0, 63.0, 102.0, 136.0, 178.0, 276.0, 493.0, 742.0, 1422.0, 2668.0, 5632.0, 12721.0, 33439.0, 104741.0, 352142.0, 363012.0, 110387.0, 34658.0, 13466.0, 5795.0, 2736.0, 1403.0, 774.0, 434.0, 297.0, 173.0, 135.0, 93.0, 70.0, 54.0, 34.0, 25.0, 17.0, 12.0, 8.0, 4.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2548828125, -0.24666595458984375, -0.2384490966796875, -0.23023223876953125, -0.222015380859375, -0.21379852294921875, -0.2055816650390625, -0.19736480712890625, -0.18914794921875, -0.18093109130859375, -0.1727142333984375, -0.16449737548828125, -0.156280517578125, -0.14806365966796875, -0.1398468017578125, -0.13162994384765625, -0.1234130859375, -0.11519622802734375, -0.1069793701171875, -0.09876251220703125, -0.090545654296875, -0.08232879638671875, -0.0741119384765625, -0.06589508056640625, -0.05767822265625, -0.04946136474609375, -0.0412445068359375, -0.03302764892578125, -0.024810791015625, -0.01659393310546875, -0.0083770751953125, -0.00016021728515625, 0.008056640625, 0.01627349853515625, 0.0244903564453125, 0.03270721435546875, 0.040924072265625, 0.04914093017578125, 0.0573577880859375, 0.06557464599609375, 0.07379150390625, 0.08200836181640625, 0.0902252197265625, 0.09844207763671875, 0.106658935546875, 0.11487579345703125, 0.1230926513671875, 0.13130950927734375, 0.1395263671875, 0.14774322509765625, 0.1559600830078125, 0.16417694091796875, 0.172393798828125, 0.18061065673828125, 0.1888275146484375, 0.19704437255859375, 0.20526123046875, 0.21347808837890625, 0.2216949462890625, 0.22991180419921875, 0.238128662109375, 0.24634552001953125, 0.2545623779296875, 0.26277923583984375, 0.27099609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 7.0, 8.0, 9.0, 7.0, 21.0, 23.0, 23.0, 34.0, 31.0, 34.0, 33.0, 32.0, 39.0, 52.0, 61.0, 46.0, 54.0, 45.0, 44.0, 42.0, 42.0, 39.0, 35.0, 35.0, 22.0, 26.0, 20.0, 25.0, 14.0, 12.0, 16.0, 8.0, 9.0, 7.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353515625, -0.3412284851074219, -0.32894134521484375, -0.3166542053222656, -0.3043670654296875, -0.2920799255371094, -0.27979278564453125, -0.2675056457519531, -0.255218505859375, -0.24293136596679688, -0.23064422607421875, -0.21835708618164062, -0.2060699462890625, -0.19378280639648438, -0.18149566650390625, -0.16920852661132812, -0.15692138671875, -0.14463424682617188, -0.13234710693359375, -0.12005996704101562, -0.1077728271484375, -0.09548568725585938, -0.08319854736328125, -0.07091140747070312, -0.058624267578125, -0.046337127685546875, -0.03404998779296875, -0.021762847900390625, -0.0094757080078125, 0.002811431884765625, 0.01509857177734375, 0.027385711669921875, 0.0396728515625, 0.051959991455078125, 0.06424713134765625, 0.07653427124023438, 0.0888214111328125, 0.10110855102539062, 0.11339569091796875, 0.12568283081054688, 0.137969970703125, 0.15025711059570312, 0.16254425048828125, 0.17483139038085938, 0.1871185302734375, 0.19940567016601562, 0.21169281005859375, 0.22397994995117188, 0.23626708984375, 0.24855422973632812, 0.26084136962890625, 0.2731285095214844, 0.2854156494140625, 0.2977027893066406, 0.30998992919921875, 0.3222770690917969, 0.334564208984375, 0.3468513488769531, 0.35913848876953125, 0.3714256286621094, 0.3837127685546875, 0.3959999084472656, 0.40828704833984375, 0.4205741882324219, 0.432861328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 23.0, 68.0, 162.0, 629.0, 4230.0, 108011.0, 888239.0, 43986.0, 2514.0, 450.0, 136.0, 44.0, 26.0, 11.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13525390625, -0.12827682495117188, -0.12129974365234375, -0.11432266235351562, -0.1073455810546875, -0.10036849975585938, -0.09339141845703125, -0.08641433715820312, -0.079437255859375, -0.07246017456054688, -0.06548309326171875, -0.058506011962890625, -0.0515289306640625, -0.044551849365234375, -0.03757476806640625, -0.030597686767578125, -0.02362060546875, -0.016643524169921875, -0.00966644287109375, -0.002689361572265625, 0.0042877197265625, 0.011264801025390625, 0.01824188232421875, 0.025218963623046875, 0.032196044921875, 0.039173126220703125, 0.04615020751953125, 0.053127288818359375, 0.0601043701171875, 0.06708145141601562, 0.07405853271484375, 0.08103561401367188, 0.0880126953125, 0.09498977661132812, 0.10196685791015625, 0.10894393920898438, 0.1159210205078125, 0.12289810180664062, 0.12987518310546875, 0.13685226440429688, 0.143829345703125, 0.15080642700195312, 0.15778350830078125, 0.16476058959960938, 0.1717376708984375, 0.17871475219726562, 0.18569183349609375, 0.19266891479492188, 0.19964599609375, 0.20662307739257812, 0.21360015869140625, 0.22057723999023438, 0.2275543212890625, 0.23453140258789062, 0.24150848388671875, 0.24848556518554688, 0.255462646484375, 0.2624397277832031, 0.26941680908203125, 0.2763938903808594, 0.2833709716796875, 0.2903480529785156, 0.29732513427734375, 0.3043022155761719, 0.311279296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 5.0, 8.0, 7.0, 5.0, 16.0, 10.0, 21.0, 17.0, 21.0, 43.0, 53.0, 78.0, 96.0, 111.0, 113.0, 89.0, 63.0, 63.0, 33.0, 20.0, 31.0, 15.0, 7.0, 10.0, 9.0, 12.0, 10.0, 5.0, 3.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.00010967254638671875, -0.00010677520185709, -0.00010387785732746124, -0.00010098051279783249, -9.808316826820374e-05, -9.518582373857498e-05, -9.228847920894623e-05, -8.939113467931747e-05, -8.649379014968872e-05, -8.359644562005997e-05, -8.069910109043121e-05, -7.780175656080246e-05, -7.49044120311737e-05, -7.200706750154495e-05, -6.91097229719162e-05, -6.621237844228745e-05, -6.331503391265869e-05, -6.041768938302994e-05, -5.7520344853401184e-05, -5.462300032377243e-05, -5.172565579414368e-05, -4.882831126451492e-05, -4.593096673488617e-05, -4.3033622205257416e-05, -4.013627767562866e-05, -3.723893314599991e-05, -3.4341588616371155e-05, -3.14442440867424e-05, -2.8546899557113647e-05, -2.5649555027484894e-05, -2.275221049785614e-05, -1.9854865968227386e-05, -1.6957521438598633e-05, -1.4060176908969879e-05, -1.1162832379341125e-05, -8.265487849712372e-06, -5.368143320083618e-06, -2.4707987904548645e-06, 4.2654573917388916e-07, 3.323890268802643e-06, 6.2212347984313965e-06, 9.11857932806015e-06, 1.2015923857688904e-05, 1.4913268387317657e-05, 1.781061291694641e-05, 2.0707957446575165e-05, 2.360530197620392e-05, 2.6502646505832672e-05, 2.9399991035461426e-05, 3.229733556509018e-05, 3.519468009471893e-05, 3.809202462434769e-05, 4.098936915397644e-05, 4.3886713683605194e-05, 4.678405821323395e-05, 4.96814027428627e-05, 5.2578747272491455e-05, 5.547609180212021e-05, 5.837343633174896e-05, 6.127078086137772e-05, 6.416812539100647e-05, 6.706546992063522e-05, 6.996281445026398e-05, 7.286015897989273e-05, 7.575750350952148e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 12.0, 23.0, 26.0, 20.0, 61.0, 89.0, 159.0, 417.0, 1098.0, 4066.0, 31315.0, 528517.0, 450750.0, 26588.0, 3614.0, 1023.0, 370.0, 186.0, 83.0, 45.0, 30.0, 23.0, 13.0, 14.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2215576171875, -0.21614933013916016, -0.2107410430908203, -0.20533275604248047, -0.19992446899414062, -0.19451618194580078, -0.18910789489746094, -0.1836996078491211, -0.17829132080078125, -0.1728830337524414, -0.16747474670410156, -0.16206645965576172, -0.15665817260742188, -0.15124988555908203, -0.1458415985107422, -0.14043331146240234, -0.1350250244140625, -0.12961673736572266, -0.12420845031738281, -0.11880016326904297, -0.11339187622070312, -0.10798358917236328, -0.10257530212402344, -0.0971670150756836, -0.09175872802734375, -0.0863504409790039, -0.08094215393066406, -0.07553386688232422, -0.07012557983398438, -0.06471729278564453, -0.05930900573730469, -0.053900718688964844, -0.048492431640625, -0.043084144592285156, -0.03767585754394531, -0.03226757049560547, -0.026859283447265625, -0.02145099639892578, -0.016042709350585938, -0.010634422302246094, -0.00522613525390625, 0.00018215179443359375, 0.0055904388427734375, 0.010998725891113281, 0.016407012939453125, 0.02181529998779297, 0.027223587036132812, 0.032631874084472656, 0.0380401611328125, 0.043448448181152344, 0.04885673522949219, 0.05426502227783203, 0.059673309326171875, 0.06508159637451172, 0.07048988342285156, 0.0758981704711914, 0.08130645751953125, 0.0867147445678711, 0.09212303161621094, 0.09753131866455078, 0.10293960571289062, 0.10834789276123047, 0.11375617980957031, 0.11916446685791016, 0.12457275390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 9.0, 14.0, 35.0, 68.0, 133.0, 176.0, 187.0, 168.0, 92.0, 62.0, 25.0, 16.0, 11.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.285400390625, -0.27924633026123047, -0.27309226989746094, -0.2669382095336914, -0.2607841491699219, -0.25463008880615234, -0.2484760284423828, -0.24232196807861328, -0.23616790771484375, -0.23001384735107422, -0.2238597869873047, -0.21770572662353516, -0.21155166625976562, -0.2053976058959961, -0.19924354553222656, -0.19308948516845703, -0.1869354248046875, -0.18078136444091797, -0.17462730407714844, -0.1684732437133789, -0.16231918334960938, -0.15616512298583984, -0.1500110626220703, -0.14385700225830078, -0.13770294189453125, -0.13154888153076172, -0.1253948211669922, -0.11924076080322266, -0.11308670043945312, -0.1069326400756836, -0.10077857971191406, -0.09462451934814453, -0.088470458984375, -0.08231639862060547, -0.07616233825683594, -0.0700082778930664, -0.06385421752929688, -0.057700157165527344, -0.05154609680175781, -0.04539203643798828, -0.03923797607421875, -0.03308391571044922, -0.026929855346679688, -0.020775794982910156, -0.014621734619140625, -0.008467674255371094, -0.0023136138916015625, 0.0038404464721679688, 0.0099945068359375, 0.01614856719970703, 0.022302627563476562, 0.028456687927246094, 0.034610748291015625, 0.040764808654785156, 0.04691886901855469, 0.05307292938232422, 0.05922698974609375, 0.06538105010986328, 0.07153511047363281, 0.07768917083740234, 0.08384323120117188, 0.0899972915649414, 0.09615135192871094, 0.10230541229248047, 0.10845947265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 6.0, 10.0, 19.0, 29.0, 61.0, 86.0, 130.0, 177.0, 171.0, 132.0, 61.0, 44.0, 28.0, 12.0, 8.0, 7.0, 10.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2139188051223755, -1.1486256122589111, -1.0833325386047363, -1.018039345741272, -0.9527461528778076, -0.8874529600143433, -0.8221598267555237, -0.7568666934967041, -0.6915735006332397, -0.6262803077697754, -0.5609871745109558, -0.49569401144981384, -0.4304008483886719, -0.3651076853275299, -0.29981452226638794, -0.23452135920524597, -0.169228196144104, -0.10393503308296204, -0.03864187002182007, 0.0266512930393219, 0.09194445610046387, 0.15723761916160583, 0.2225307822227478, 0.28782394528388977, 0.35311710834503174, 0.4184102714061737, 0.4837034344673157, 0.5489965677261353, 0.6142897605895996, 0.679582953453064, 0.7448760867118835, 0.8101692199707031, 0.875462532043457, 0.9407557249069214, 1.0060489177703857, 1.0713419914245605, 1.136635184288025, 1.2019283771514893, 1.267221450805664, 1.3325146436691284, 1.3978078365325928, 1.4631010293960571, 1.5283942222595215, 1.5936872959136963, 1.6589804887771606, 1.724273681640625, 1.7895667552947998, 1.8548599481582642, 1.9201531410217285, 1.9854463338851929, 2.0507395267486572, 2.116032600402832, 2.181325912475586, 2.2466189861297607, 2.3119120597839355, 2.3772053718566895, 2.4424984455108643, 2.507791519165039, 2.573084831237793, 2.6383779048919678, 2.7036709785461426, 2.7689642906188965, 2.8342573642730713, 2.899550676345825, 2.96484375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 11.0, 11.0, 9.0, 6.0, 13.0, 25.0, 21.0, 32.0, 29.0, 30.0, 53.0, 49.0, 60.0, 60.0, 55.0, 83.0, 56.0, 61.0, 55.0, 40.0, 48.0, 33.0, 36.0, 24.0, 18.0, 25.0, 14.0, 15.0, 8.0, 9.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.435960054397583, -3.350484848022461, -3.265009880065918, -3.179534673690796, -3.094059467315674, -3.008584499359131, -2.923109292984009, -2.8376340866088867, -2.7521591186523438, -2.6666839122772217, -2.5812089443206787, -2.4957337379455566, -2.4102585315704346, -2.3247833251953125, -2.2393083572387695, -2.1538331508636475, -2.0683579444885254, -1.9828828573226929, -1.8974076509475708, -1.8119325637817383, -1.7264573574066162, -1.6409822702407837, -1.5555071830749512, -1.470031976699829, -1.3845568895339966, -1.299081802368164, -1.213606595993042, -1.1281315088272095, -1.042656421661377, -0.9571812152862549, -0.8717061281204224, -0.7862309813499451, -0.7007555961608887, -0.6152804493904114, -0.5298053026199341, -0.44433021545410156, -0.35885506868362427, -0.273379921913147, -0.18790483474731445, -0.10242968797683716, -0.016954541206359863, 0.06852059066295624, 0.15399572253227234, 0.23947083950042725, 0.32494598627090454, 0.41042113304138184, 0.49589622020721436, 0.5813713669776917, 0.666846513748169, 0.7523216605186462, 0.8377968072891235, 0.923271894454956, 1.0087471008300781, 1.0942221879959106, 1.1796972751617432, 1.2651724815368652, 1.3506475687026978, 1.4361226558685303, 1.5215978622436523, 1.6070729494094849, 1.6925480365753174, 1.7780232429504395, 1.863498330116272, 1.9489734172821045, 2.0344486236572266]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 10.0, 5.0, 10.0, 7.0, 16.0, 13.0, 35.0, 38.0, 68.0, 68.0, 127.0, 224.0, 389.0, 752.0, 1418.0, 3136.0, 8191.0, 32285.0, 398977.0, 3643523.0, 80888.0, 14847.0, 4782.0, 2006.0, 990.0, 532.0, 321.0, 206.0, 110.0, 83.0, 48.0, 43.0, 31.0, 22.0, 20.0, 11.0, 12.0, 7.0, 4.0, 12.0, 4.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4423828125, -0.42725372314453125, -0.4121246337890625, -0.39699554443359375, -0.381866455078125, -0.36673736572265625, -0.3516082763671875, -0.33647918701171875, -0.32135009765625, -0.30622100830078125, -0.2910919189453125, -0.27596282958984375, -0.260833740234375, -0.24570465087890625, -0.2305755615234375, -0.21544647216796875, -0.2003173828125, -0.18518829345703125, -0.1700592041015625, -0.15493011474609375, -0.139801025390625, -0.12467193603515625, -0.1095428466796875, -0.09441375732421875, -0.07928466796875, -0.06415557861328125, -0.0490264892578125, -0.03389739990234375, -0.018768310546875, -0.00363922119140625, 0.0114898681640625, 0.02661895751953125, 0.041748046875, 0.05687713623046875, 0.0720062255859375, 0.08713531494140625, 0.102264404296875, 0.11739349365234375, 0.1325225830078125, 0.14765167236328125, 0.16278076171875, 0.17790985107421875, 0.1930389404296875, 0.20816802978515625, 0.223297119140625, 0.23842620849609375, 0.2535552978515625, 0.26868438720703125, 0.2838134765625, 0.29894256591796875, 0.3140716552734375, 0.32920074462890625, 0.344329833984375, 0.35945892333984375, 0.3745880126953125, 0.38971710205078125, 0.40484619140625, 0.41997528076171875, 0.4351043701171875, 0.45023345947265625, 0.465362548828125, 0.48049163818359375, 0.4956207275390625, 0.5107498168945312, 0.52587890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 25.0, 32.0, 36.0, 50.0, 50.0, 100.0, 100.0, 97.0, 96.0, 108.0, 86.0, 47.0, 34.0, 39.0, 22.0, 18.0, 11.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1312255859375, -0.1266632080078125, -0.122100830078125, -0.1175384521484375, -0.11297607421875, -0.1084136962890625, -0.103851318359375, -0.0992889404296875, -0.0947265625, -0.0901641845703125, -0.085601806640625, -0.0810394287109375, -0.07647705078125, -0.0719146728515625, -0.067352294921875, -0.0627899169921875, -0.0582275390625, -0.0536651611328125, -0.049102783203125, -0.0445404052734375, -0.03997802734375, -0.0354156494140625, -0.030853271484375, -0.0262908935546875, -0.021728515625, -0.0171661376953125, -0.012603759765625, -0.0080413818359375, -0.00347900390625, 0.0010833740234375, 0.005645751953125, 0.0102081298828125, 0.0147705078125, 0.0193328857421875, 0.023895263671875, 0.0284576416015625, 0.03302001953125, 0.0375823974609375, 0.042144775390625, 0.0467071533203125, 0.05126953125, 0.0558319091796875, 0.060394287109375, 0.0649566650390625, 0.06951904296875, 0.0740814208984375, 0.078643798828125, 0.0832061767578125, 0.0877685546875, 0.0923309326171875, 0.096893310546875, 0.1014556884765625, 0.10601806640625, 0.1105804443359375, 0.115142822265625, 0.1197052001953125, 0.124267578125, 0.1288299560546875, 0.133392333984375, 0.1379547119140625, 0.14251708984375, 0.1470794677734375, 0.151641845703125, 0.1562042236328125, 0.1607666015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 8.0, 7.0, 10.0, 15.0, 23.0, 49.0, 74.0, 96.0, 170.0, 300.0, 531.0, 966.0, 1808.0, 3871.0, 10017.0, 44853.0, 695212.0, 3299438.0, 108305.0, 18161.0, 5490.0, 2301.0, 1132.0, 570.0, 334.0, 205.0, 120.0, 57.0, 42.0, 36.0, 27.0, 17.0, 10.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.42333984375, -0.41306495666503906, -0.4027900695800781, -0.3925151824951172, -0.38224029541015625, -0.3719654083251953, -0.3616905212402344, -0.35141563415527344, -0.3411407470703125, -0.33086585998535156, -0.3205909729003906, -0.3103160858154297, -0.30004119873046875, -0.2897663116455078, -0.2794914245605469, -0.26921653747558594, -0.258941650390625, -0.24866676330566406, -0.23839187622070312, -0.2281169891357422, -0.21784210205078125, -0.2075672149658203, -0.19729232788085938, -0.18701744079589844, -0.1767425537109375, -0.16646766662597656, -0.15619277954101562, -0.1459178924560547, -0.13564300537109375, -0.1253681182861328, -0.11509323120117188, -0.10481834411621094, -0.09454345703125, -0.08426856994628906, -0.07399368286132812, -0.06371879577636719, -0.05344390869140625, -0.04316902160644531, -0.032894134521484375, -0.022619247436523438, -0.0123443603515625, -0.0020694732666015625, 0.008205413818359375, 0.018480300903320312, 0.02875518798828125, 0.03903007507324219, 0.049304962158203125, 0.05957984924316406, 0.069854736328125, 0.08012962341308594, 0.09040451049804688, 0.10067939758300781, 0.11095428466796875, 0.12122917175292969, 0.13150405883789062, 0.14177894592285156, 0.1520538330078125, 0.16232872009277344, 0.17260360717773438, 0.1828784942626953, 0.19315338134765625, 0.2034282684326172, 0.21370315551757812, 0.22397804260253906, 0.2342529296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 9.0, 6.0, 16.0, 32.0, 71.0, 139.0, 341.0, 1633.0, 1219.0, 312.0, 119.0, 59.0, 40.0, 20.0, 18.0, 5.0, 15.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20947265625, -0.20246315002441406, -0.19545364379882812, -0.1884441375732422, -0.18143463134765625, -0.1744251251220703, -0.16741561889648438, -0.16040611267089844, -0.1533966064453125, -0.14638710021972656, -0.13937759399414062, -0.1323680877685547, -0.12535858154296875, -0.11834907531738281, -0.11133956909179688, -0.10433006286621094, -0.097320556640625, -0.09031105041503906, -0.08330154418945312, -0.07629203796386719, -0.06928253173828125, -0.06227302551269531, -0.055263519287109375, -0.04825401306152344, -0.0412445068359375, -0.03423500061035156, -0.027225494384765625, -0.020215988159179688, -0.01320648193359375, -0.0061969757080078125, 0.000812530517578125, 0.007822036743164062, 0.01483154296875, 0.021841049194335938, 0.028850555419921875, 0.03586006164550781, 0.04286956787109375, 0.04987907409667969, 0.056888580322265625, 0.06389808654785156, 0.0709075927734375, 0.07791709899902344, 0.08492660522460938, 0.09193611145019531, 0.09894561767578125, 0.10595512390136719, 0.11296463012695312, 0.11997413635253906, 0.126983642578125, 0.13399314880371094, 0.14100265502929688, 0.1480121612548828, 0.15502166748046875, 0.1620311737060547, 0.16904067993164062, 0.17605018615722656, 0.1830596923828125, 0.19006919860839844, 0.19707870483398438, 0.2040882110595703, 0.21109771728515625, 0.2181072235107422, 0.22511672973632812, 0.23212623596191406, 0.2391357421875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 9.0, 29.0, 67.0, 130.0, 217.0, 223.0, 159.0, 94.0, 35.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8653675317764282, -0.8305153846740723, -0.7956632375717163, -0.7608110308647156, -0.7259588837623596, -0.6911067366600037, -0.6562545299530029, -0.621402382850647, -0.586550235748291, -0.5516980886459351, -0.5168459415435791, -0.48199373483657837, -0.4471415877342224, -0.41228944063186646, -0.3774372637271881, -0.34258508682250977, -0.3077329397201538, -0.27288079261779785, -0.2380286157131195, -0.20317645370960236, -0.1683242917060852, -0.13347212970256805, -0.0986199676990509, -0.06376780569553375, -0.0289156436920166, 0.005936518311500549, 0.0407886803150177, 0.07564084231853485, 0.110493004322052, 0.14534516632556915, 0.1801973283290863, 0.21504949033260345, 0.24990177154541016, 0.2847539186477661, 0.31960609555244446, 0.3544582724571228, 0.38931041955947876, 0.4241625666618347, 0.45901474356651306, 0.4938669204711914, 0.5287190675735474, 0.5635712146759033, 0.5984233617782593, 0.63327556848526, 0.668127715587616, 0.7029798626899719, 0.7378320693969727, 0.7726842164993286, 0.8075363636016846, 0.8423885107040405, 0.8772406578063965, 0.9120928645133972, 0.9469450116157532, 0.9817971587181091, 1.0166493654251099, 1.0515015125274658, 1.0863536596298218, 1.1212058067321777, 1.1560579538345337, 1.1909101009368896, 1.2257623672485352, 1.2606145143508911, 1.295466661453247, 1.330318808555603, 1.365170955657959]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 5.0, 7.0, 14.0, 17.0, 21.0, 25.0, 29.0, 52.0, 52.0, 70.0, 63.0, 62.0, 76.0, 78.0, 77.0, 77.0, 42.0, 49.0, 42.0, 42.0, 25.0, 18.0, 19.0, 11.0, 12.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6058604121208191, -0.5822413563728333, -0.5586223602294922, -0.5350033044815063, -0.5113843083381653, -0.48776525259017944, -0.464146226644516, -0.44052720069885254, -0.4169081449508667, -0.39328911900520325, -0.3696700930595398, -0.34605103731155396, -0.3224320113658905, -0.29881298542022705, -0.2751939594745636, -0.25157493352890015, -0.2279559075832367, -0.20433688163757324, -0.1807178407907486, -0.15709881484508514, -0.1334797739982605, -0.10986074805259705, -0.0862417221069336, -0.06262268126010895, -0.039003655314445496, -0.015384623780846596, 0.008234407752752304, 0.031853437423706055, 0.055472470819950104, 0.07909150421619415, 0.1027105301618576, 0.12632957100868225, 0.1499485969543457, 0.17356762290000916, 0.1971866637468338, 0.22080568969249725, 0.2444247305393219, 0.26804375648498535, 0.2916627824306488, 0.31528180837631226, 0.3389008641242981, 0.36251989006996155, 0.386138916015625, 0.40975797176361084, 0.4333769977092743, 0.45699602365493774, 0.4806150496006012, 0.5042340755462646, 0.5278531312942505, 0.5514721870422363, 0.5750911831855774, 0.5987102389335632, 0.6223292350769043, 0.6459482908248901, 0.669567346572876, 0.693186342716217, 0.7168053388595581, 0.740424394607544, 0.764043390750885, 0.7876624464988708, 0.8112814426422119, 0.8349004983901978, 0.8585195541381836, 0.8821385502815247, 0.9057576060295105]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 14.0, 24.0, 58.0, 72.0, 138.0, 303.0, 685.0, 1713.0, 5988.0, 42290.0, 679861.0, 291914.0, 19424.0, 3742.0, 1228.0, 522.0, 274.0, 136.0, 60.0, 27.0, 17.0, 12.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7678298950195312, -0.7451324462890625, -0.7224349975585938, -0.699737548828125, -0.6770401000976562, -0.6543426513671875, -0.6316452026367188, -0.60894775390625, -0.5862503051757812, -0.5635528564453125, -0.5408554077148438, -0.518157958984375, -0.49546051025390625, -0.4727630615234375, -0.45006561279296875, -0.4273681640625, -0.40467071533203125, -0.3819732666015625, -0.35927581787109375, -0.336578369140625, -0.31388092041015625, -0.2911834716796875, -0.26848602294921875, -0.24578857421875, -0.22309112548828125, -0.2003936767578125, -0.17769622802734375, -0.154998779296875, -0.13230133056640625, -0.1096038818359375, -0.08690643310546875, -0.064208984375, -0.04151153564453125, -0.0188140869140625, 0.00388336181640625, 0.026580810546875, 0.04927825927734375, 0.0719757080078125, 0.09467315673828125, 0.11737060546875, 0.14006805419921875, 0.1627655029296875, 0.18546295166015625, 0.208160400390625, 0.23085784912109375, 0.2535552978515625, 0.27625274658203125, 0.2989501953125, 0.32164764404296875, 0.3443450927734375, 0.36704254150390625, 0.389739990234375, 0.41243743896484375, 0.4351348876953125, 0.45783233642578125, 0.48052978515625, 0.5032272338867188, 0.5259246826171875, 0.5486221313476562, 0.571319580078125, 0.5940170288085938, 0.6167144775390625, 0.6394119262695312, 0.662109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 8.0, 14.0, 21.0, 21.0, 54.0, 56.0, 60.0, 92.0, 122.0, 119.0, 104.0, 117.0, 59.0, 45.0, 38.0, 28.0, 10.0, 7.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12030029296875, -0.11536312103271484, -0.11042594909667969, -0.10548877716064453, -0.10055160522460938, -0.09561443328857422, -0.09067726135253906, -0.0857400894165039, -0.08080291748046875, -0.0758657455444336, -0.07092857360839844, -0.06599140167236328, -0.061054229736328125, -0.05611705780029297, -0.05117988586425781, -0.046242713928222656, -0.0413055419921875, -0.036368370056152344, -0.03143119812011719, -0.02649402618408203, -0.021556854248046875, -0.01661968231201172, -0.011682510375976562, -0.006745338439941406, -0.00180816650390625, 0.0031290054321289062, 0.008066177368164062, 0.013003349304199219, 0.017940521240234375, 0.02287769317626953, 0.027814865112304688, 0.032752037048339844, 0.037689208984375, 0.042626380920410156, 0.04756355285644531, 0.05250072479248047, 0.057437896728515625, 0.06237506866455078, 0.06731224060058594, 0.0722494125366211, 0.07718658447265625, 0.0821237564086914, 0.08706092834472656, 0.09199810028076172, 0.09693527221679688, 0.10187244415283203, 0.10680961608886719, 0.11174678802490234, 0.1166839599609375, 0.12162113189697266, 0.1265583038330078, 0.13149547576904297, 0.13643264770507812, 0.14136981964111328, 0.14630699157714844, 0.1512441635131836, 0.15618133544921875, 0.1611185073852539, 0.16605567932128906, 0.17099285125732422, 0.17593002319335938, 0.18086719512939453, 0.1858043670654297, 0.19074153900146484, 0.1956787109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 10.0, 18.0, 23.0, 46.0, 95.0, 162.0, 295.0, 677.0, 1594.0, 4427.0, 14306.0, 57077.0, 280408.0, 512205.0, 134802.0, 29525.0, 8127.0, 2746.0, 1041.0, 433.0, 217.0, 144.0, 82.0, 36.0, 28.0, 10.0, 7.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24658203125, -0.23642349243164062, -0.22626495361328125, -0.21610641479492188, -0.2059478759765625, -0.19578933715820312, -0.18563079833984375, -0.17547225952148438, -0.165313720703125, -0.15515518188476562, -0.14499664306640625, -0.13483810424804688, -0.1246795654296875, -0.11452102661132812, -0.10436248779296875, -0.09420394897460938, -0.08404541015625, -0.07388687133789062, -0.06372833251953125, -0.053569793701171875, -0.0434112548828125, -0.033252716064453125, -0.02309417724609375, -0.012935638427734375, -0.002777099609375, 0.007381439208984375, 0.01753997802734375, 0.027698516845703125, 0.0378570556640625, 0.048015594482421875, 0.05817413330078125, 0.06833267211914062, 0.0784912109375, 0.08864974975585938, 0.09880828857421875, 0.10896682739257812, 0.1191253662109375, 0.12928390502929688, 0.13944244384765625, 0.14960098266601562, 0.159759521484375, 0.16991806030273438, 0.18007659912109375, 0.19023513793945312, 0.2003936767578125, 0.21055221557617188, 0.22071075439453125, 0.23086929321289062, 0.24102783203125, 0.2511863708496094, 0.26134490966796875, 0.2715034484863281, 0.2816619873046875, 0.2918205261230469, 0.30197906494140625, 0.3121376037597656, 0.322296142578125, 0.3324546813964844, 0.34261322021484375, 0.3527717590332031, 0.3629302978515625, 0.3730888366699219, 0.38324737548828125, 0.3934059143066406, 0.403564453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 2.0, 6.0, 7.0, 9.0, 5.0, 11.0, 16.0, 21.0, 18.0, 37.0, 23.0, 29.0, 27.0, 43.0, 30.0, 39.0, 43.0, 29.0, 51.0, 33.0, 44.0, 41.0, 43.0, 32.0, 43.0, 34.0, 35.0, 39.0, 33.0, 27.0, 23.0, 23.0, 18.0, 16.0, 8.0, 11.0, 9.0, 8.0, 11.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.363525390625, -0.35344696044921875, -0.3433685302734375, -0.33329010009765625, -0.323211669921875, -0.31313323974609375, -0.3030548095703125, -0.29297637939453125, -0.28289794921875, -0.27281951904296875, -0.2627410888671875, -0.25266265869140625, -0.242584228515625, -0.23250579833984375, -0.2224273681640625, -0.21234893798828125, -0.2022705078125, -0.19219207763671875, -0.1821136474609375, -0.17203521728515625, -0.161956787109375, -0.15187835693359375, -0.1417999267578125, -0.13172149658203125, -0.12164306640625, -0.11156463623046875, -0.1014862060546875, -0.09140777587890625, -0.081329345703125, -0.07125091552734375, -0.0611724853515625, -0.05109405517578125, -0.041015625, -0.03093719482421875, -0.0208587646484375, -0.01078033447265625, -0.000701904296875, 0.00937652587890625, 0.0194549560546875, 0.02953338623046875, 0.03961181640625, 0.04969024658203125, 0.0597686767578125, 0.06984710693359375, 0.079925537109375, 0.09000396728515625, 0.1000823974609375, 0.11016082763671875, 0.1202392578125, 0.13031768798828125, 0.1403961181640625, 0.15047454833984375, 0.160552978515625, 0.17063140869140625, 0.1807098388671875, 0.19078826904296875, 0.20086669921875, 0.21094512939453125, 0.2210235595703125, 0.23110198974609375, 0.241180419921875, 0.25125885009765625, 0.2613372802734375, 0.27141571044921875, 0.281494140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 2.0, 7.0, 13.0, 34.0, 85.0, 255.0, 1356.0, 40854.0, 988510.0, 16152.0, 963.0, 201.0, 71.0, 22.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.41574859619140625, -0.4040069580078125, -0.39226531982421875, -0.380523681640625, -0.36878204345703125, -0.3570404052734375, -0.34529876708984375, -0.33355712890625, -0.32181549072265625, -0.3100738525390625, -0.29833221435546875, -0.286590576171875, -0.27484893798828125, -0.2631072998046875, -0.25136566162109375, -0.2396240234375, -0.22788238525390625, -0.2161407470703125, -0.20439910888671875, -0.192657470703125, -0.18091583251953125, -0.1691741943359375, -0.15743255615234375, -0.14569091796875, -0.13394927978515625, -0.1222076416015625, -0.11046600341796875, -0.098724365234375, -0.08698272705078125, -0.0752410888671875, -0.06349945068359375, -0.0517578125, -0.04001617431640625, -0.0282745361328125, -0.01653289794921875, -0.004791259765625, 0.00695037841796875, 0.0186920166015625, 0.03043365478515625, 0.04217529296875, 0.05391693115234375, 0.0656585693359375, 0.07740020751953125, 0.089141845703125, 0.10088348388671875, 0.1126251220703125, 0.12436676025390625, 0.1361083984375, 0.14785003662109375, 0.1595916748046875, 0.17133331298828125, 0.183074951171875, 0.19481658935546875, 0.2065582275390625, 0.21829986572265625, 0.23004150390625, 0.24178314208984375, 0.2535247802734375, 0.26526641845703125, 0.277008056640625, 0.28874969482421875, 0.3004913330078125, 0.31223297119140625, 0.323974609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 4.0, 11.0, 9.0, 11.0, 7.0, 16.0, 20.0, 20.0, 26.0, 40.0, 65.0, 78.0, 125.0, 134.0, 116.0, 73.0, 45.0, 44.0, 29.0, 20.0, 22.0, 18.0, 14.0, 12.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011581182479858398, -0.00011294335126876831, -0.00011007487773895264, -0.00010720640420913696, -0.00010433793067932129, -0.00010146945714950562, -9.860098361968994e-05, -9.573251008987427e-05, -9.28640365600586e-05, -8.999556303024292e-05, -8.712708950042725e-05, -8.425861597061157e-05, -8.13901424407959e-05, -7.852166891098022e-05, -7.565319538116455e-05, -7.278472185134888e-05, -6.99162483215332e-05, -6.704777479171753e-05, -6.417930126190186e-05, -6.131082773208618e-05, -5.844235420227051e-05, -5.5573880672454834e-05, -5.270540714263916e-05, -4.9836933612823486e-05, -4.696846008300781e-05, -4.409998655319214e-05, -4.1231513023376465e-05, -3.836303949356079e-05, -3.549456596374512e-05, -3.262609243392944e-05, -2.975761890411377e-05, -2.6889145374298096e-05, -2.4020671844482422e-05, -2.1152198314666748e-05, -1.8283724784851074e-05, -1.54152512550354e-05, -1.2546777725219727e-05, -9.678304195404053e-06, -6.809830665588379e-06, -3.941357135772705e-06, -1.0728836059570312e-06, 1.7955899238586426e-06, 4.664063453674316e-06, 7.53253698348999e-06, 1.0401010513305664e-05, 1.3269484043121338e-05, 1.6137957572937012e-05, 1.9006431102752686e-05, 2.187490463256836e-05, 2.4743378162384033e-05, 2.7611851692199707e-05, 3.048032522201538e-05, 3.3348798751831055e-05, 3.621727228164673e-05, 3.90857458114624e-05, 4.1954219341278076e-05, 4.482269287109375e-05, 4.7691166400909424e-05, 5.05596399307251e-05, 5.342811346054077e-05, 5.6296586990356445e-05, 5.916506052017212e-05, 6.203353404998779e-05, 6.490200757980347e-05, 6.777048110961914e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 8.0, 9.0, 15.0, 44.0, 104.0, 321.0, 1030.0, 4782.0, 58098.0, 876229.0, 99484.0, 6535.0, 1275.0, 367.0, 121.0, 57.0, 19.0, 14.0, 15.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.23296165466308594, -0.22581100463867188, -0.2186603546142578, -0.21150970458984375, -0.2043590545654297, -0.19720840454101562, -0.19005775451660156, -0.1829071044921875, -0.17575645446777344, -0.16860580444335938, -0.1614551544189453, -0.15430450439453125, -0.1471538543701172, -0.14000320434570312, -0.13285255432128906, -0.125701904296875, -0.11855125427246094, -0.11140060424804688, -0.10424995422363281, -0.09709930419921875, -0.08994865417480469, -0.08279800415039062, -0.07564735412597656, -0.0684967041015625, -0.06134605407714844, -0.054195404052734375, -0.04704475402832031, -0.03989410400390625, -0.03274345397949219, -0.025592803955078125, -0.018442153930664062, -0.01129150390625, -0.0041408538818359375, 0.003009796142578125, 0.010160446166992188, 0.01731109619140625, 0.024461746215820312, 0.031612396240234375, 0.03876304626464844, 0.0459136962890625, 0.05306434631347656, 0.060214996337890625, 0.06736564636230469, 0.07451629638671875, 0.08166694641113281, 0.08881759643554688, 0.09596824645996094, 0.103118896484375, 0.11026954650878906, 0.11742019653320312, 0.12457084655761719, 0.13172149658203125, 0.1388721466064453, 0.14602279663085938, 0.15317344665527344, 0.1603240966796875, 0.16747474670410156, 0.17462539672851562, 0.1817760467529297, 0.18892669677734375, 0.1960773468017578, 0.20322799682617188, 0.21037864685058594, 0.217529296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 11.0, 7.0, 11.0, 26.0, 34.0, 46.0, 62.0, 67.0, 73.0, 101.0, 107.0, 77.0, 80.0, 59.0, 51.0, 41.0, 25.0, 26.0, 17.0, 12.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0924072265625, -0.08945274353027344, -0.08649826049804688, -0.08354377746582031, -0.08058929443359375, -0.07763481140136719, -0.07468032836914062, -0.07172584533691406, -0.0687713623046875, -0.06581687927246094, -0.06286239624023438, -0.05990791320800781, -0.05695343017578125, -0.05399894714355469, -0.051044464111328125, -0.04808998107910156, -0.045135498046875, -0.04218101501464844, -0.039226531982421875, -0.03627204895019531, -0.03331756591796875, -0.030363082885742188, -0.027408599853515625, -0.024454116821289062, -0.0214996337890625, -0.018545150756835938, -0.015590667724609375, -0.012636184692382812, -0.00968170166015625, -0.0067272186279296875, -0.003772735595703125, -0.0008182525634765625, 0.00213623046875, 0.0050907135009765625, 0.008045196533203125, 0.010999679565429688, 0.01395416259765625, 0.016908645629882812, 0.019863128662109375, 0.022817611694335938, 0.0257720947265625, 0.028726577758789062, 0.031681060791015625, 0.03463554382324219, 0.03759002685546875, 0.04054450988769531, 0.043498992919921875, 0.04645347595214844, 0.049407958984375, 0.05236244201660156, 0.055316925048828125, 0.05827140808105469, 0.06122589111328125, 0.06418037414550781, 0.06713485717773438, 0.07008934020996094, 0.0730438232421875, 0.07599830627441406, 0.07895278930664062, 0.08190727233886719, 0.08486175537109375, 0.08781623840332031, 0.09077072143554688, 0.09372520446777344, 0.0966796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 9.0, 23.0, 25.0, 48.0, 60.0, 108.0, 135.0, 175.0, 141.0, 87.0, 55.0, 38.0, 24.0, 14.0, 16.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.293674945831299, -2.240849256515503, -2.188023328781128, -2.135197639465332, -2.082371950149536, -2.029546022415161, -1.9767203330993652, -1.9238945245742798, -1.8710687160491943, -1.8182429075241089, -1.765417218208313, -1.7125914096832275, -1.659765601158142, -1.6069397926330566, -1.5541141033172607, -1.5012882947921753, -1.4484626054763794, -1.395636796951294, -1.342811107635498, -1.2899852991104126, -1.2371594905853271, -1.1843338012695312, -1.1315079927444458, -1.0786821842193604, -1.0258564949035645, -0.9730307459831238, -0.9202049374580383, -0.8673791885375977, -0.8145533800125122, -0.7617276310920715, -0.7089018821716309, -0.6560760736465454, -0.60325026512146, -0.5504245162010193, -0.49759870767593384, -0.44477295875549316, -0.3919471800327301, -0.33912140130996704, -0.28629565238952637, -0.2334698736667633, -0.18064409494400024, -0.12781831622123718, -0.07499255239963531, -0.022166788578033447, 0.030658990144729614, 0.08348476886749268, 0.13631051778793335, 0.1891362965106964, 0.24196207523345947, 0.29478785395622253, 0.3476136326789856, 0.40043938159942627, 0.45326516032218933, 0.5060909390449524, 0.5589166879653931, 0.6117424964904785, 0.6645682454109192, 0.7173939943313599, 0.7702198028564453, 0.823045551776886, 0.8758713006973267, 0.9286971092224121, 0.9815228581428528, 1.0343486070632935, 1.087174415588379]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 14.0, 19.0, 22.0, 15.0, 24.0, 36.0, 37.0, 46.0, 37.0, 49.0, 54.0, 70.0, 56.0, 51.0, 68.0, 49.0, 58.0, 40.0, 43.0, 41.0, 28.0, 28.0, 29.0, 21.0, 14.0, 13.0, 6.0, 4.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5013625621795654, -2.4256365299224854, -2.3499104976654053, -2.2741847038269043, -2.198458671569824, -2.122732639312744, -2.047006607055664, -1.971280574798584, -1.8955546617507935, -1.8198286294937134, -1.7441027164459229, -1.6683766841888428, -1.5926506519317627, -1.5169247388839722, -1.441198706626892, -1.3654727935791016, -1.2897467613220215, -1.2140207290649414, -1.1382948160171509, -1.0625687837600708, -0.9868428111076355, -0.9111168384552002, -0.8353908061981201, -0.7596648335456848, -0.6839388608932495, -0.6082128882408142, -0.5324869155883789, -0.45676088333129883, -0.3810349106788635, -0.3053089380264282, -0.22958293557167053, -0.15385693311691284, -0.07813096046447754, -0.0024049729108810425, 0.07332101464271545, 0.14904700219631195, 0.22477298974990845, 0.30049896240234375, 0.37622496485710144, 0.45195096731185913, 0.5276769399642944, 0.6034029126167297, 0.679128885269165, 0.7548549175262451, 0.8305808901786804, 0.9063068628311157, 0.9820328950881958, 1.0577588081359863, 1.1334848403930664, 1.2092108726501465, 1.284936785697937, 1.360662817955017, 1.4363887310028076, 1.5121147632598877, 1.5878407955169678, 1.6635668277740479, 1.7392927408218384, 1.8150187730789185, 1.890744686126709, 1.966470718383789, 2.042196750640869, 2.117922782897949, 2.19364857673645, 2.2693746089935303, 2.3451006412506104]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 10.0, 11.0, 23.0, 38.0, 64.0, 100.0, 178.0, 323.0, 536.0, 1231.0, 2860.0, 9694.0, 53355.0, 3742556.0, 350587.0, 23317.0, 5555.0, 1963.0, 825.0, 375.0, 262.0, 144.0, 77.0, 54.0, 45.0, 23.0, 17.0, 16.0, 8.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4013671875, -0.3883323669433594, -0.37529754638671875, -0.3622627258300781, -0.3492279052734375, -0.3361930847167969, -0.32315826416015625, -0.3101234436035156, -0.297088623046875, -0.2840538024902344, -0.27101898193359375, -0.2579841613769531, -0.2449493408203125, -0.23191452026367188, -0.21887969970703125, -0.20584487915039062, -0.19281005859375, -0.17977523803710938, -0.16674041748046875, -0.15370559692382812, -0.1406707763671875, -0.12763595581054688, -0.11460113525390625, -0.10156631469726562, -0.088531494140625, -0.07549667358398438, -0.06246185302734375, -0.049427032470703125, -0.0363922119140625, -0.023357391357421875, -0.01032257080078125, 0.002712249755859375, 0.0157470703125, 0.028781890869140625, 0.04181671142578125, 0.054851531982421875, 0.0678863525390625, 0.08092117309570312, 0.09395599365234375, 0.10699081420898438, 0.120025634765625, 0.13306045532226562, 0.14609527587890625, 0.15913009643554688, 0.1721649169921875, 0.18519973754882812, 0.19823455810546875, 0.21126937866210938, 0.22430419921875, 0.23733901977539062, 0.25037384033203125, 0.2634086608886719, 0.2764434814453125, 0.2894783020019531, 0.30251312255859375, 0.3155479431152344, 0.328582763671875, 0.3416175842285156, 0.35465240478515625, 0.3676872253417969, 0.3807220458984375, 0.3937568664550781, 0.40679168701171875, 0.4198265075683594, 0.432861328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 15.0, 41.0, 43.0, 72.0, 68.0, 85.0, 122.0, 108.0, 102.0, 91.0, 63.0, 52.0, 37.0, 25.0, 16.0, 4.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11700439453125, -0.11195659637451172, -0.10690879821777344, -0.10186100006103516, -0.09681320190429688, -0.0917654037475586, -0.08671760559082031, -0.08166980743408203, -0.07662200927734375, -0.07157421112060547, -0.06652641296386719, -0.061478614807128906, -0.056430816650390625, -0.051383018493652344, -0.04633522033691406, -0.04128742218017578, -0.0362396240234375, -0.03119182586669922, -0.026144027709960938, -0.021096229553222656, -0.016048431396484375, -0.011000633239746094, -0.0059528350830078125, -0.0009050369262695312, 0.00414276123046875, 0.009190559387207031, 0.014238357543945312, 0.019286155700683594, 0.024333953857421875, 0.029381752014160156, 0.03442955017089844, 0.03947734832763672, 0.044525146484375, 0.04957294464111328, 0.05462074279785156, 0.059668540954589844, 0.06471633911132812, 0.0697641372680664, 0.07481193542480469, 0.07985973358154297, 0.08490753173828125, 0.08995532989501953, 0.09500312805175781, 0.1000509262084961, 0.10509872436523438, 0.11014652252197266, 0.11519432067871094, 0.12024211883544922, 0.1252899169921875, 0.13033771514892578, 0.13538551330566406, 0.14043331146240234, 0.14548110961914062, 0.1505289077758789, 0.1555767059326172, 0.16062450408935547, 0.16567230224609375, 0.17072010040283203, 0.1757678985595703, 0.1808156967163086, 0.18586349487304688, 0.19091129302978516, 0.19595909118652344, 0.20100688934326172, 0.2060546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 23.0, 15.0, 35.0, 54.0, 88.0, 162.0, 272.0, 498.0, 1023.0, 2611.0, 8841.0, 53413.0, 2214403.0, 1850058.0, 49405.0, 8456.0, 2551.0, 1006.0, 524.0, 289.0, 189.0, 128.0, 75.0, 52.0, 22.0, 23.0, 14.0, 8.0, 10.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.22676467895507812, -0.21768951416015625, -0.20861434936523438, -0.1995391845703125, -0.19046401977539062, -0.18138885498046875, -0.17231369018554688, -0.163238525390625, -0.15416336059570312, -0.14508819580078125, -0.13601303100585938, -0.1269378662109375, -0.11786270141601562, -0.10878753662109375, -0.09971237182617188, -0.09063720703125, -0.08156204223632812, -0.07248687744140625, -0.06341171264648438, -0.0543365478515625, -0.045261383056640625, -0.03618621826171875, -0.027111053466796875, -0.018035888671875, -0.008960723876953125, 0.00011444091796875, 0.009189605712890625, 0.0182647705078125, 0.027339935302734375, 0.03641510009765625, 0.045490264892578125, 0.0545654296875, 0.06364059448242188, 0.07271575927734375, 0.08179092407226562, 0.0908660888671875, 0.09994125366210938, 0.10901641845703125, 0.11809158325195312, 0.127166748046875, 0.13624191284179688, 0.14531707763671875, 0.15439224243164062, 0.1634674072265625, 0.17254257202148438, 0.18161773681640625, 0.19069290161132812, 0.19976806640625, 0.20884323120117188, 0.21791839599609375, 0.22699356079101562, 0.2360687255859375, 0.24514389038085938, 0.25421905517578125, 0.2632942199707031, 0.272369384765625, 0.2814445495605469, 0.29051971435546875, 0.2995948791503906, 0.3086700439453125, 0.3177452087402344, 0.32682037353515625, 0.3358955383300781, 0.344970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 8.0, 14.0, 14.0, 22.0, 27.0, 57.0, 107.0, 238.0, 748.0, 1904.0, 540.0, 188.0, 83.0, 48.0, 22.0, 19.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08050537109375, -0.07655048370361328, -0.07259559631347656, -0.06864070892333984, -0.06468582153320312, -0.060730934143066406, -0.05677604675292969, -0.05282115936279297, -0.04886627197265625, -0.04491138458251953, -0.04095649719238281, -0.037001609802246094, -0.033046722412109375, -0.029091835021972656, -0.025136947631835938, -0.02118206024169922, -0.0172271728515625, -0.013272285461425781, -0.009317398071289062, -0.005362510681152344, -0.001407623291015625, 0.0025472640991210938, 0.0065021514892578125, 0.010457038879394531, 0.01441192626953125, 0.01836681365966797, 0.022321701049804688, 0.026276588439941406, 0.030231475830078125, 0.034186363220214844, 0.03814125061035156, 0.04209613800048828, 0.046051025390625, 0.05000591278076172, 0.05396080017089844, 0.057915687561035156, 0.061870574951171875, 0.0658254623413086, 0.06978034973144531, 0.07373523712158203, 0.07769012451171875, 0.08164501190185547, 0.08559989929199219, 0.0895547866821289, 0.09350967407226562, 0.09746456146240234, 0.10141944885253906, 0.10537433624267578, 0.1093292236328125, 0.11328411102294922, 0.11723899841308594, 0.12119388580322266, 0.12514877319335938, 0.1291036605834961, 0.1330585479736328, 0.13701343536376953, 0.14096832275390625, 0.14492321014404297, 0.1488780975341797, 0.1528329849243164, 0.15678787231445312, 0.16074275970458984, 0.16469764709472656, 0.16865253448486328, 0.172607421875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 37.0, 121.0, 254.0, 285.0, 174.0, 79.0, 25.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6286548376083374, -0.6005786657333374, -0.5725024938583374, -0.5444262623786926, -0.5163500905036926, -0.4882739186286926, -0.46019771695137024, -0.43212151527404785, -0.40404534339904785, -0.37596917152404785, -0.34789296984672546, -0.3198167681694031, -0.2917405962944031, -0.2636644244194031, -0.2355882227420807, -0.2075120359659195, -0.1794358491897583, -0.1513596624135971, -0.12328347563743591, -0.09520728886127472, -0.06713110208511353, -0.03905491530895233, -0.010978728532791138, 0.017097458243370056, 0.04517364501953125, 0.07324983179569244, 0.10132601857185364, 0.12940220534801483, 0.15747839212417603, 0.18555457890033722, 0.2136307656764984, 0.2417069524526596, 0.2697831392288208, 0.2978593111038208, 0.3259355127811432, 0.3540117144584656, 0.3820878863334656, 0.4101640582084656, 0.43824025988578796, 0.46631646156311035, 0.49439263343811035, 0.5224688053131104, 0.5505449771881104, 0.5786212086677551, 0.6066973805427551, 0.6347735524177551, 0.6628497838973999, 0.6909259557723999, 0.7190021276473999, 0.7470782995223999, 0.7751544713973999, 0.8032307028770447, 0.8313068747520447, 0.8593830466270447, 0.8874592781066895, 0.9155354499816895, 0.9436116218566895, 0.9716877937316895, 0.9997639656066895, 1.0278401374816895, 1.0559163093566895, 1.083992600440979, 1.112068772315979, 1.140144944190979, 1.168221116065979]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 10.0, 10.0, 13.0, 14.0, 13.0, 28.0, 47.0, 31.0, 46.0, 39.0, 42.0, 60.0, 46.0, 55.0, 45.0, 46.0, 55.0, 66.0, 56.0, 51.0, 34.0, 30.0, 39.0, 16.0, 23.0, 20.0, 9.0, 10.0, 8.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.40505343675613403, -0.3944965600967407, -0.3839397132396698, -0.3733828365802765, -0.3628259599208832, -0.35226911306381226, -0.34171223640441895, -0.33115535974502563, -0.3205984830856323, -0.310041606426239, -0.2994847595691681, -0.2889278829097748, -0.27837100625038147, -0.26781415939331055, -0.25725728273391724, -0.24670040607452393, -0.236143559217453, -0.2255866974592209, -0.21502982079982758, -0.20447295904159546, -0.19391608238220215, -0.18335922062397003, -0.17280235886573792, -0.1622454822063446, -0.1516886204481125, -0.14113175868988037, -0.13057488203048706, -0.12001802027225494, -0.10946115106344223, -0.09890428185462952, -0.0883474200963974, -0.07779055088758469, -0.06723368167877197, -0.05667681246995926, -0.046119946986436844, -0.03556308150291443, -0.025006212294101715, -0.014449343085289001, -0.0038924813270568848, 0.006664387881755829, 0.017221257090568542, 0.027778124436736107, 0.03833499178290367, 0.048891857266426086, 0.0594487264752388, 0.07000559568405151, 0.08056245744228363, 0.09111932665109634, 0.10167619585990906, 0.11223306506872177, 0.12278993427753448, 0.1333467960357666, 0.1439036726951599, 0.15446053445339203, 0.16501739621162415, 0.17557427287101746, 0.18613113462924957, 0.1966879963874817, 0.207244873046875, 0.21780173480510712, 0.22835859656333923, 0.23891547322273254, 0.24947233498096466, 0.2600291967391968, 0.2705860733985901]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 6.0, 12.0, 20.0, 29.0, 31.0, 38.0, 55.0, 83.0, 135.0, 185.0, 241.0, 410.0, 653.0, 1197.0, 2318.0, 5208.0, 12665.0, 41014.0, 172592.0, 518985.0, 216075.0, 49822.0, 15000.0, 5689.0, 2563.0, 1362.0, 810.0, 449.0, 294.0, 198.0, 106.0, 85.0, 59.0, 40.0, 24.0, 22.0, 15.0, 8.0, 7.0, 9.0, 6.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3349609375, -0.3243522644042969, -0.31374359130859375, -0.3031349182128906, -0.2925262451171875, -0.2819175720214844, -0.27130889892578125, -0.2607002258300781, -0.250091552734375, -0.23948287963867188, -0.22887420654296875, -0.21826553344726562, -0.2076568603515625, -0.19704818725585938, -0.18643951416015625, -0.17583084106445312, -0.16522216796875, -0.15461349487304688, -0.14400482177734375, -0.13339614868164062, -0.1227874755859375, -0.11217880249023438, -0.10157012939453125, -0.09096145629882812, -0.080352783203125, -0.06974411010742188, -0.05913543701171875, -0.048526763916015625, -0.0379180908203125, -0.027309417724609375, -0.01670074462890625, -0.006092071533203125, 0.0045166015625, 0.015125274658203125, 0.02573394775390625, 0.036342620849609375, 0.0469512939453125, 0.057559967041015625, 0.06816864013671875, 0.07877731323242188, 0.089385986328125, 0.09999465942382812, 0.11060333251953125, 0.12121200561523438, 0.1318206787109375, 0.14242935180664062, 0.15303802490234375, 0.16364669799804688, 0.17425537109375, 0.18486404418945312, 0.19547271728515625, 0.20608139038085938, 0.2166900634765625, 0.22729873657226562, 0.23790740966796875, 0.24851608276367188, 0.259124755859375, 0.2697334289550781, 0.28034210205078125, 0.2909507751464844, 0.3015594482421875, 0.3121681213378906, 0.32277679443359375, 0.3333854675292969, 0.343994140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 6.0, 20.0, 26.0, 40.0, 56.0, 67.0, 84.0, 105.0, 107.0, 113.0, 98.0, 76.0, 63.0, 42.0, 27.0, 19.0, 13.0, 4.0, 8.0, 1.0, 7.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10758399963378906, -0.10261917114257812, -0.09765434265136719, -0.09268951416015625, -0.08772468566894531, -0.08275985717773438, -0.07779502868652344, -0.0728302001953125, -0.06786537170410156, -0.06290054321289062, -0.05793571472167969, -0.05297088623046875, -0.04800605773925781, -0.043041229248046875, -0.03807640075683594, -0.033111572265625, -0.028146743774414062, -0.023181915283203125, -0.018217086791992188, -0.01325225830078125, -0.008287429809570312, -0.003322601318359375, 0.0016422271728515625, 0.0066070556640625, 0.011571884155273438, 0.016536712646484375, 0.021501541137695312, 0.02646636962890625, 0.03143119812011719, 0.036396026611328125, 0.04136085510253906, 0.04632568359375, 0.05129051208496094, 0.056255340576171875, 0.06122016906738281, 0.06618499755859375, 0.07114982604980469, 0.07611465454101562, 0.08107948303222656, 0.0860443115234375, 0.09100914001464844, 0.09597396850585938, 0.10093879699707031, 0.10590362548828125, 0.11086845397949219, 0.11583328247070312, 0.12079811096191406, 0.125762939453125, 0.13072776794433594, 0.13569259643554688, 0.1406574249267578, 0.14562225341796875, 0.1505870819091797, 0.15555191040039062, 0.16051673889160156, 0.1654815673828125, 0.17044639587402344, 0.17541122436523438, 0.1803760528564453, 0.18534088134765625, 0.1903057098388672, 0.19527053833007812, 0.20023536682128906, 0.2052001953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 10.0, 10.0, 18.0, 32.0, 30.0, 45.0, 65.0, 91.0, 156.0, 228.0, 413.0, 727.0, 1398.0, 2777.0, 6285.0, 14888.0, 39262.0, 121943.0, 351994.0, 334014.0, 112123.0, 36265.0, 13961.0, 5923.0, 2728.0, 1313.0, 723.0, 379.0, 245.0, 141.0, 102.0, 76.0, 46.0, 29.0, 31.0, 18.0, 19.0, 6.0, 8.0, 1.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.22998046875, -0.22320938110351562, -0.21643829345703125, -0.20966720581054688, -0.2028961181640625, -0.19612503051757812, -0.18935394287109375, -0.18258285522460938, -0.175811767578125, -0.16904067993164062, -0.16226959228515625, -0.15549850463867188, -0.1487274169921875, -0.14195632934570312, -0.13518524169921875, -0.12841415405273438, -0.12164306640625, -0.11487197875976562, -0.10810089111328125, -0.10132980346679688, -0.0945587158203125, -0.08778762817382812, -0.08101654052734375, -0.07424545288085938, -0.067474365234375, -0.060703277587890625, -0.05393218994140625, -0.047161102294921875, -0.0403900146484375, -0.033618927001953125, -0.02684783935546875, -0.020076751708984375, -0.0133056640625, -0.006534576416015625, 0.00023651123046875, 0.007007598876953125, 0.0137786865234375, 0.020549774169921875, 0.02732086181640625, 0.034091949462890625, 0.040863037109375, 0.047634124755859375, 0.05440521240234375, 0.061176300048828125, 0.0679473876953125, 0.07471847534179688, 0.08148956298828125, 0.08826065063476562, 0.09503173828125, 0.10180282592773438, 0.10857391357421875, 0.11534500122070312, 0.1221160888671875, 0.12888717651367188, 0.13565826416015625, 0.14242935180664062, 0.149200439453125, 0.15597152709960938, 0.16274261474609375, 0.16951370239257812, 0.1762847900390625, 0.18305587768554688, 0.18982696533203125, 0.19659805297851562, 0.203369140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 3.0, 10.0, 4.0, 8.0, 13.0, 11.0, 14.0, 18.0, 15.0, 15.0, 13.0, 27.0, 30.0, 28.0, 22.0, 33.0, 45.0, 39.0, 47.0, 41.0, 28.0, 46.0, 45.0, 32.0, 52.0, 44.0, 33.0, 33.0, 29.0, 37.0, 30.0, 22.0, 16.0, 17.0, 20.0, 18.0, 13.0, 5.0, 11.0, 6.0, 8.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.309326171875, -0.299713134765625, -0.29010009765625, -0.280487060546875, -0.2708740234375, -0.261260986328125, -0.25164794921875, -0.242034912109375, -0.232421875, -0.222808837890625, -0.21319580078125, -0.203582763671875, -0.1939697265625, -0.184356689453125, -0.17474365234375, -0.165130615234375, -0.155517578125, -0.145904541015625, -0.13629150390625, -0.126678466796875, -0.1170654296875, -0.107452392578125, -0.09783935546875, -0.088226318359375, -0.07861328125, -0.069000244140625, -0.05938720703125, -0.049774169921875, -0.0401611328125, -0.030548095703125, -0.02093505859375, -0.011322021484375, -0.001708984375, 0.007904052734375, 0.01751708984375, 0.027130126953125, 0.0367431640625, 0.046356201171875, 0.05596923828125, 0.065582275390625, 0.0751953125, 0.084808349609375, 0.09442138671875, 0.104034423828125, 0.1136474609375, 0.123260498046875, 0.13287353515625, 0.142486572265625, 0.152099609375, 0.161712646484375, 0.17132568359375, 0.180938720703125, 0.1905517578125, 0.200164794921875, 0.20977783203125, 0.219390869140625, 0.22900390625, 0.238616943359375, 0.24822998046875, 0.257843017578125, 0.2674560546875, 0.277069091796875, 0.28668212890625, 0.296295166015625, 0.305908203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 34.0, 50.0, 95.0, 341.0, 1261.0, 6627.0, 94544.0, 857582.0, 80151.0, 6155.0, 1165.0, 311.0, 116.0, 54.0, 29.0, 6.0, 11.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17714691162109375, -0.1704559326171875, -0.16376495361328125, -0.157073974609375, -0.15038299560546875, -0.1436920166015625, -0.13700103759765625, -0.13031005859375, -0.12361907958984375, -0.1169281005859375, -0.11023712158203125, -0.103546142578125, -0.09685516357421875, -0.0901641845703125, -0.08347320556640625, -0.0767822265625, -0.07009124755859375, -0.0634002685546875, -0.05670928955078125, -0.050018310546875, -0.04332733154296875, -0.0366363525390625, -0.02994537353515625, -0.02325439453125, -0.01656341552734375, -0.0098724365234375, -0.00318145751953125, 0.003509521484375, 0.01020050048828125, 0.0168914794921875, 0.02358245849609375, 0.0302734375, 0.03696441650390625, 0.0436553955078125, 0.05034637451171875, 0.057037353515625, 0.06372833251953125, 0.0704193115234375, 0.07711029052734375, 0.08380126953125, 0.09049224853515625, 0.0971832275390625, 0.10387420654296875, 0.110565185546875, 0.11725616455078125, 0.1239471435546875, 0.13063812255859375, 0.1373291015625, 0.14402008056640625, 0.1507110595703125, 0.15740203857421875, 0.164093017578125, 0.17078399658203125, 0.1774749755859375, 0.18416595458984375, 0.19085693359375, 0.19754791259765625, 0.2042388916015625, 0.21092987060546875, 0.217620849609375, 0.22431182861328125, 0.2310028076171875, 0.23769378662109375, 0.244384765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 7.0, 6.0, 15.0, 10.0, 14.0, 12.0, 24.0, 18.0, 25.0, 34.0, 35.0, 60.0, 56.0, 78.0, 93.0, 100.0, 70.0, 50.0, 57.0, 39.0, 33.0, 25.0, 19.0, 15.0, 13.0, 21.0, 8.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.969141006469727e-05, -7.726624608039856e-05, -7.484108209609985e-05, -7.241591811180115e-05, -6.999075412750244e-05, -6.756559014320374e-05, -6.514042615890503e-05, -6.271526217460632e-05, -6.029009819030762e-05, -5.786493420600891e-05, -5.5439770221710205e-05, -5.30146062374115e-05, -5.058944225311279e-05, -4.816427826881409e-05, -4.573911428451538e-05, -4.3313950300216675e-05, -4.088878631591797e-05, -3.846362233161926e-05, -3.603845834732056e-05, -3.361329436302185e-05, -3.1188130378723145e-05, -2.876296639442444e-05, -2.6337802410125732e-05, -2.3912638425827026e-05, -2.148747444152832e-05, -1.9062310457229614e-05, -1.6637146472930908e-05, -1.4211982488632202e-05, -1.1786818504333496e-05, -9.36165452003479e-06, -6.936490535736084e-06, -4.511326551437378e-06, -2.086162567138672e-06, 3.390014171600342e-07, 2.7641654014587402e-06, 5.189329385757446e-06, 7.614493370056152e-06, 1.0039657354354858e-05, 1.2464821338653564e-05, 1.488998532295227e-05, 1.7315149307250977e-05, 1.9740313291549683e-05, 2.216547727584839e-05, 2.4590641260147095e-05, 2.70158052444458e-05, 2.9440969228744507e-05, 3.186613321304321e-05, 3.429129719734192e-05, 3.6716461181640625e-05, 3.914162516593933e-05, 4.156678915023804e-05, 4.399195313453674e-05, 4.641711711883545e-05, 4.8842281103134155e-05, 5.126744508743286e-05, 5.369260907173157e-05, 5.6117773056030273e-05, 5.854293704032898e-05, 6.0968101024627686e-05, 6.339326500892639e-05, 6.58184289932251e-05, 6.82435929775238e-05, 7.066875696182251e-05, 7.309392094612122e-05, 7.551908493041992e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 9.0, 10.0, 13.0, 27.0, 46.0, 82.0, 122.0, 258.0, 517.0, 1359.0, 4766.0, 26534.0, 272837.0, 663107.0, 65724.0, 9391.0, 2250.0, 769.0, 338.0, 171.0, 70.0, 46.0, 38.0, 17.0, 19.0, 9.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16681861877441406, -0.16164016723632812, -0.1564617156982422, -0.15128326416015625, -0.1461048126220703, -0.14092636108398438, -0.13574790954589844, -0.1305694580078125, -0.12539100646972656, -0.12021255493164062, -0.11503410339355469, -0.10985565185546875, -0.10467720031738281, -0.09949874877929688, -0.09432029724121094, -0.089141845703125, -0.08396339416503906, -0.07878494262695312, -0.07360649108886719, -0.06842803955078125, -0.06324958801269531, -0.058071136474609375, -0.05289268493652344, -0.0477142333984375, -0.04253578186035156, -0.037357330322265625, -0.03217887878417969, -0.02700042724609375, -0.021821975708007812, -0.016643524169921875, -0.011465072631835938, -0.00628662109375, -0.0011081695556640625, 0.004070281982421875, 0.009248733520507812, 0.01442718505859375, 0.019605636596679688, 0.024784088134765625, 0.029962539672851562, 0.0351409912109375, 0.04031944274902344, 0.045497894287109375, 0.05067634582519531, 0.05585479736328125, 0.06103324890136719, 0.06621170043945312, 0.07139015197753906, 0.076568603515625, 0.08174705505371094, 0.08692550659179688, 0.09210395812988281, 0.09728240966796875, 0.10246086120605469, 0.10763931274414062, 0.11281776428222656, 0.1179962158203125, 0.12317466735839844, 0.12835311889648438, 0.1335315704345703, 0.13871002197265625, 0.1438884735107422, 0.14906692504882812, 0.15424537658691406, 0.159423828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 14.0, 22.0, 23.0, 34.0, 48.0, 61.0, 97.0, 93.0, 122.0, 130.0, 93.0, 65.0, 53.0, 38.0, 28.0, 16.0, 20.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0], "bins": [-0.209716796875, -0.2054119110107422, -0.20110702514648438, -0.19680213928222656, -0.19249725341796875, -0.18819236755371094, -0.18388748168945312, -0.1795825958251953, -0.1752777099609375, -0.1709728240966797, -0.16666793823242188, -0.16236305236816406, -0.15805816650390625, -0.15375328063964844, -0.14944839477539062, -0.1451435089111328, -0.140838623046875, -0.1365337371826172, -0.13222885131835938, -0.12792396545410156, -0.12361907958984375, -0.11931419372558594, -0.11500930786132812, -0.11070442199707031, -0.1063995361328125, -0.10209465026855469, -0.09778976440429688, -0.09348487854003906, -0.08917999267578125, -0.08487510681152344, -0.08057022094726562, -0.07626533508300781, -0.07196044921875, -0.06765556335449219, -0.06335067749023438, -0.05904579162597656, -0.05474090576171875, -0.05043601989746094, -0.046131134033203125, -0.04182624816894531, -0.0375213623046875, -0.03321647644042969, -0.028911590576171875, -0.024606704711914062, -0.02030181884765625, -0.015996932983398438, -0.011692047119140625, -0.0073871612548828125, -0.003082275390625, 0.0012226104736328125, 0.005527496337890625, 0.009832382202148438, 0.01413726806640625, 0.018442153930664062, 0.022747039794921875, 0.027051925659179688, 0.0313568115234375, 0.03566169738769531, 0.039966583251953125, 0.04427146911621094, 0.04857635498046875, 0.05288124084472656, 0.057186126708984375, 0.06149101257324219, 0.0657958984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 10.0, 19.0, 32.0, 44.0, 72.0, 117.0, 148.0, 148.0, 140.0, 95.0, 63.0, 43.0, 18.0, 15.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2023637294769287, -1.142227292060852, -1.082090973854065, -1.0219545364379883, -0.9618180990219116, -0.9016817212104797, -0.8415453433990479, -0.7814089059829712, -0.7212724685668945, -0.6611360907554626, -0.600999653339386, -0.5408632755279541, -0.48072683811187744, -0.42059046030044556, -0.3604540526866913, -0.300317645072937, -0.24018126726150513, -0.18004485964775085, -0.11990845948457718, -0.0597720593214035, 0.00036434829235076904, 0.06050074100494385, 0.12063714861869812, 0.1807735562324524, 0.24090996384620667, 0.30104637145996094, 0.3611827790737152, 0.4213191866874695, 0.48145556449890137, 0.541592001914978, 0.6017283797264099, 0.6618647575378418, 0.7220011949539185, 0.7821375727653503, 0.842274010181427, 0.9024103879928589, 0.9625468254089355, 1.0226831436157227, 1.0828195810317993, 1.142956018447876, 1.2030924558639526, 1.2632288932800293, 1.3233652114868164, 1.383501648902893, 1.4436380863189697, 1.5037744045257568, 1.5639108419418335, 1.6240472793579102, 1.6841835975646973, 1.744320034980774, 1.804456353187561, 1.8645927906036377, 1.9247292280197144, 1.984865665435791, 2.045001983642578, 2.1051383018493652, 2.1652748584747314, 2.2254111766815186, 2.2855477333068848, 2.345684051513672, 2.405820369720459, 2.465956926345825, 2.5260932445526123, 2.5862298011779785, 2.6463661193847656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 11.0, 10.0, 4.0, 7.0, 9.0, 19.0, 20.0, 22.0, 16.0, 25.0, 38.0, 34.0, 30.0, 49.0, 47.0, 32.0, 56.0, 45.0, 33.0, 40.0, 44.0, 39.0, 47.0, 39.0, 41.0, 26.0, 18.0, 35.0, 25.0, 20.0, 22.0, 13.0, 19.0, 7.0, 12.0, 7.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8370895385742188, -1.7772239446640015, -1.7173584699630737, -1.6574928760528564, -1.5976274013519287, -1.5377618074417114, -1.4778962135314941, -1.4180307388305664, -1.3581651449203491, -1.2982995510101318, -1.238434076309204, -1.1785684823989868, -1.118703007698059, -1.0588374137878418, -0.9989718794822693, -0.9391063451766968, -0.8792408108711243, -0.8193752765655518, -0.7595097422599792, -0.6996442079544067, -0.6397786140441895, -0.5799130797386169, -0.5200475454330444, -0.46018198132514954, -0.400316447019577, -0.3404509127140045, -0.2805853486061096, -0.2207198143005371, -0.1608542650938034, -0.1009887158870697, -0.04112318158149719, 0.018742382526397705, 0.07860791683197021, 0.13847346603870392, 0.19833901524543762, 0.25820454955101013, 0.31807011365890503, 0.37793564796447754, 0.43780118227005005, 0.49766674637794495, 0.5575323104858398, 0.6173978447914124, 0.6772633790969849, 0.7371289730072021, 0.7969945073127747, 0.8568600416183472, 0.9167255759239197, 0.9765911102294922, 1.03645658493042, 1.0963221788406372, 1.156187653541565, 1.2160532474517822, 1.27591872215271, 1.3357843160629272, 1.3956499099731445, 1.4555153846740723, 1.5153809785842896, 1.5752465724945068, 1.6351120471954346, 1.6949776411056519, 1.7548431158065796, 1.8147087097167969, 1.8745741844177246, 1.934439778327942, 1.9943053722381592]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 8.0, 11.0, 17.0, 27.0, 44.0, 91.0, 138.0, 226.0, 395.0, 775.0, 1529.0, 3807.0, 13403.0, 85896.0, 3851177.0, 206959.0, 20638.0, 5226.0, 1897.0, 853.0, 451.0, 248.0, 152.0, 84.0, 54.0, 51.0, 26.0, 28.0, 14.0, 12.0, 10.0, 7.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.313720703125, -0.3009910583496094, -0.28826141357421875, -0.2755317687988281, -0.2628021240234375, -0.2500724792480469, -0.23734283447265625, -0.22461318969726562, -0.211883544921875, -0.19915390014648438, -0.18642425537109375, -0.17369461059570312, -0.1609649658203125, -0.14823532104492188, -0.13550567626953125, -0.12277603149414062, -0.11004638671875, -0.09731674194335938, -0.08458709716796875, -0.07185745239257812, -0.0591278076171875, -0.046398162841796875, -0.03366851806640625, -0.020938873291015625, -0.008209228515625, 0.004520416259765625, 0.01725006103515625, 0.029979705810546875, 0.0427093505859375, 0.055438995361328125, 0.06816864013671875, 0.08089828491210938, 0.0936279296875, 0.10635757446289062, 0.11908721923828125, 0.13181686401367188, 0.1445465087890625, 0.15727615356445312, 0.17000579833984375, 0.18273544311523438, 0.195465087890625, 0.20819473266601562, 0.22092437744140625, 0.23365402221679688, 0.2463836669921875, 0.2591133117675781, 0.27184295654296875, 0.2845726013183594, 0.29730224609375, 0.3100318908691406, 0.32276153564453125, 0.3354911804199219, 0.3482208251953125, 0.3609504699707031, 0.37368011474609375, 0.3864097595214844, 0.399139404296875, 0.4118690490722656, 0.42459869384765625, 0.4373283386230469, 0.4500579833984375, 0.4627876281738281, 0.47551727294921875, 0.4882469177246094, 0.5009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 10.0, 20.0, 21.0, 43.0, 55.0, 65.0, 67.0, 92.0, 110.0, 110.0, 94.0, 75.0, 67.0, 43.0, 33.0, 26.0, 21.0, 9.0, 6.0, 4.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.119873046875, -0.11465072631835938, -0.10942840576171875, -0.10420608520507812, -0.0989837646484375, -0.09376144409179688, -0.08853912353515625, -0.08331680297851562, -0.078094482421875, -0.07287216186523438, -0.06764984130859375, -0.062427520751953125, -0.0572052001953125, -0.051982879638671875, -0.04676055908203125, -0.041538238525390625, -0.03631591796875, -0.031093597412109375, -0.02587127685546875, -0.020648956298828125, -0.0154266357421875, -0.010204315185546875, -0.00498199462890625, 0.000240325927734375, 0.005462646484375, 0.010684967041015625, 0.01590728759765625, 0.021129608154296875, 0.0263519287109375, 0.031574249267578125, 0.03679656982421875, 0.042018890380859375, 0.0472412109375, 0.052463531494140625, 0.05768585205078125, 0.06290817260742188, 0.0681304931640625, 0.07335281372070312, 0.07857513427734375, 0.08379745483398438, 0.089019775390625, 0.09424209594726562, 0.09946441650390625, 0.10468673706054688, 0.1099090576171875, 0.11513137817382812, 0.12035369873046875, 0.12557601928710938, 0.13079833984375, 0.13602066040039062, 0.14124298095703125, 0.14646530151367188, 0.1516876220703125, 0.15690994262695312, 0.16213226318359375, 0.16735458374023438, 0.172576904296875, 0.17779922485351562, 0.18302154541015625, 0.18824386596679688, 0.1934661865234375, 0.19868850708007812, 0.20391082763671875, 0.20913314819335938, 0.21435546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 11.0, 12.0, 19.0, 35.0, 67.0, 135.0, 242.0, 536.0, 1158.0, 2605.0, 6963.0, 31351.0, 397783.0, 3596363.0, 131971.0, 16923.0, 4658.0, 1768.0, 861.0, 409.0, 193.0, 109.0, 46.0, 28.0, 13.0, 14.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23974609375, -0.23157119750976562, -0.22339630126953125, -0.21522140502929688, -0.2070465087890625, -0.19887161254882812, -0.19069671630859375, -0.18252182006835938, -0.174346923828125, -0.16617202758789062, -0.15799713134765625, -0.14982223510742188, -0.1416473388671875, -0.13347244262695312, -0.12529754638671875, -0.11712265014648438, -0.10894775390625, -0.10077285766601562, -0.09259796142578125, -0.08442306518554688, -0.0762481689453125, -0.06807327270507812, -0.05989837646484375, -0.051723480224609375, -0.043548583984375, -0.035373687744140625, -0.02719879150390625, -0.019023895263671875, -0.0108489990234375, -0.002674102783203125, 0.00550079345703125, 0.013675689697265625, 0.0218505859375, 0.030025482177734375, 0.03820037841796875, 0.046375274658203125, 0.0545501708984375, 0.06272506713867188, 0.07089996337890625, 0.07907485961914062, 0.087249755859375, 0.09542465209960938, 0.10359954833984375, 0.11177444458007812, 0.1199493408203125, 0.12812423706054688, 0.13629913330078125, 0.14447402954101562, 0.15264892578125, 0.16082382202148438, 0.16899871826171875, 0.17717361450195312, 0.1853485107421875, 0.19352340698242188, 0.20169830322265625, 0.20987319946289062, 0.218048095703125, 0.22622299194335938, 0.23439788818359375, 0.24257278442382812, 0.2507476806640625, 0.2589225769042969, 0.26709747314453125, 0.2752723693847656, 0.283447265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 16.0, 12.0, 29.0, 38.0, 68.0, 165.0, 328.0, 1143.0, 1459.0, 396.0, 169.0, 98.0, 47.0, 24.0, 16.0, 13.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1126708984375, -0.10865974426269531, -0.10464859008789062, -0.10063743591308594, -0.09662628173828125, -0.09261512756347656, -0.08860397338867188, -0.08459281921386719, -0.0805816650390625, -0.07657051086425781, -0.07255935668945312, -0.06854820251464844, -0.06453704833984375, -0.06052589416503906, -0.056514739990234375, -0.05250358581542969, -0.048492431640625, -0.04448127746582031, -0.040470123291015625, -0.03645896911621094, -0.03244781494140625, -0.028436660766601562, -0.024425506591796875, -0.020414352416992188, -0.0164031982421875, -0.012392044067382812, -0.008380889892578125, -0.0043697357177734375, -0.00035858154296875, 0.0036525726318359375, 0.007663726806640625, 0.011674880981445312, 0.01568603515625, 0.019697189331054688, 0.023708343505859375, 0.027719497680664062, 0.03173065185546875, 0.03574180603027344, 0.039752960205078125, 0.04376411437988281, 0.0477752685546875, 0.05178642272949219, 0.055797576904296875, 0.05980873107910156, 0.06381988525390625, 0.06783103942871094, 0.07184219360351562, 0.07585334777832031, 0.079864501953125, 0.08387565612792969, 0.08788681030273438, 0.09189796447753906, 0.09590911865234375, 0.09992027282714844, 0.10393142700195312, 0.10794258117675781, 0.1119537353515625, 0.11596488952636719, 0.11997604370117188, 0.12398719787597656, 0.12799835205078125, 0.13200950622558594, 0.13602066040039062, 0.1400318145751953, 0.14404296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 15.0, 45.0, 51.0, 114.0, 171.0, 208.0, 172.0, 111.0, 60.0, 23.0, 14.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5676390528678894, -0.5452802777290344, -0.5229215025901794, -0.5005627274513245, -0.4782039523124695, -0.4558451771736145, -0.4334864318370819, -0.41112765669822693, -0.38876888155937195, -0.36641010642051697, -0.344051331281662, -0.3216925859451294, -0.2993338108062744, -0.27697503566741943, -0.25461626052856445, -0.23225748538970947, -0.2098987102508545, -0.1875399351119995, -0.16518115997314453, -0.14282239973545074, -0.12046362459659576, -0.09810484945774078, -0.075746089220047, -0.05338731408119202, -0.031028538942337036, -0.008669767528772354, 0.013689003884792328, 0.03604777157306671, 0.05840654671192169, 0.08076532185077667, 0.10312408208847046, 0.12548285722732544, 0.14784163236618042, 0.1702004075050354, 0.19255918264389038, 0.21491794288158417, 0.23727671802043915, 0.2596355080604553, 0.2819942533969879, 0.3043530285358429, 0.3267118036746979, 0.34907057881355286, 0.37142935395240784, 0.39378809928894043, 0.4161468744277954, 0.4385056495666504, 0.46086442470550537, 0.48322319984436035, 0.5055819749832153, 0.5279407501220703, 0.5502995252609253, 0.5726583003997803, 0.5950170755386353, 0.6173758506774902, 0.6397346258163452, 0.6620934009552002, 0.6844521760940552, 0.7068109512329102, 0.7291697263717651, 0.7515285015106201, 0.7738872766494751, 0.7962460517883301, 0.8186048269271851, 0.84096360206604, 0.8633223176002502]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 3.0, 6.0, 8.0, 15.0, 11.0, 5.0, 26.0, 20.0, 21.0, 34.0, 29.0, 43.0, 44.0, 47.0, 46.0, 44.0, 47.0, 45.0, 53.0, 51.0, 49.0, 44.0, 41.0, 31.0, 32.0, 41.0, 29.0, 23.0, 14.0, 15.0, 15.0, 12.0, 15.0, 10.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3764731287956238, -0.36572128534317017, -0.35496947169303894, -0.3442176282405853, -0.3334658145904541, -0.3227139711380005, -0.3119621276855469, -0.30121028423309326, -0.29045847058296204, -0.2797066271305084, -0.2689548134803772, -0.2582029700279236, -0.24745114147663116, -0.23669931292533875, -0.22594746947288513, -0.2151956409215927, -0.2044438123703003, -0.19369198381900787, -0.18294015526771545, -0.17218831181526184, -0.16143648326396942, -0.150684654712677, -0.1399328112602234, -0.12918098270893097, -0.11842915415763855, -0.10767732560634613, -0.09692548960447311, -0.0861736536026001, -0.07542182505130768, -0.06466999650001526, -0.05391816049814224, -0.043166324496269226, -0.03241449594497681, -0.02166266366839409, -0.01091083139181137, -0.00015899911522865295, 0.010592833161354065, 0.021344665437936783, 0.0320964977145195, 0.04284833371639252, 0.053600162267684937, 0.06435199081897736, 0.07510382682085037, 0.08585566282272339, 0.09660749137401581, 0.10735931992530823, 0.11811115592718124, 0.12886299192905426, 0.13961482048034668, 0.1503666490316391, 0.16111847758293152, 0.17187032103538513, 0.18262214958667755, 0.19337397813796997, 0.20412582159042358, 0.214877650141716, 0.22562947869300842, 0.23638130724430084, 0.24713313579559326, 0.2578849792480469, 0.2686368227005005, 0.2793886363506317, 0.2901404798030853, 0.30089229345321655, 0.31164413690567017]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 4.0, 11.0, 8.0, 20.0, 21.0, 40.0, 43.0, 77.0, 132.0, 215.0, 389.0, 777.0, 1677.0, 4070.0, 12923.0, 64732.0, 571501.0, 335737.0, 40771.0, 9369.0, 3205.0, 1306.0, 639.0, 345.0, 196.0, 110.0, 78.0, 51.0, 32.0, 22.0, 14.0, 10.0, 9.0, 11.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.421875, -0.40775299072265625, -0.3936309814453125, -0.37950897216796875, -0.365386962890625, -0.35126495361328125, -0.3371429443359375, -0.32302093505859375, -0.30889892578125, -0.29477691650390625, -0.2806549072265625, -0.26653289794921875, -0.252410888671875, -0.23828887939453125, -0.2241668701171875, -0.21004486083984375, -0.1959228515625, -0.18180084228515625, -0.1676788330078125, -0.15355682373046875, -0.139434814453125, -0.12531280517578125, -0.1111907958984375, -0.09706878662109375, -0.08294677734375, -0.06882476806640625, -0.0547027587890625, -0.04058074951171875, -0.026458740234375, -0.01233673095703125, 0.0017852783203125, 0.01590728759765625, 0.030029296875, 0.04415130615234375, 0.0582733154296875, 0.07239532470703125, 0.086517333984375, 0.10063934326171875, 0.1147613525390625, 0.12888336181640625, 0.14300537109375, 0.15712738037109375, 0.1712493896484375, 0.18537139892578125, 0.199493408203125, 0.21361541748046875, 0.2277374267578125, 0.24185943603515625, 0.2559814453125, 0.27010345458984375, 0.2842254638671875, 0.29834747314453125, 0.312469482421875, 0.32659149169921875, 0.3407135009765625, 0.35483551025390625, 0.36895751953125, 0.38307952880859375, 0.3972015380859375, 0.41132354736328125, 0.425445556640625, 0.43956756591796875, 0.4536895751953125, 0.46781158447265625, 0.48193359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 17.0, 11.0, 36.0, 57.0, 64.0, 67.0, 78.0, 99.0, 108.0, 98.0, 84.0, 70.0, 62.0, 33.0, 26.0, 21.0, 15.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12077522277832031, -0.11581802368164062, -0.11086082458496094, -0.10590362548828125, -0.10094642639160156, -0.09598922729492188, -0.09103202819824219, -0.0860748291015625, -0.08111763000488281, -0.07616043090820312, -0.07120323181152344, -0.06624603271484375, -0.06128883361816406, -0.056331634521484375, -0.05137443542480469, -0.046417236328125, -0.04146003723144531, -0.036502838134765625, -0.03154563903808594, -0.02658843994140625, -0.021631240844726562, -0.016674041748046875, -0.011716842651367188, -0.0067596435546875, -0.0018024444580078125, 0.003154754638671875, 0.008111953735351562, 0.01306915283203125, 0.018026351928710938, 0.022983551025390625, 0.027940750122070312, 0.03289794921875, 0.03785514831542969, 0.042812347412109375, 0.04776954650878906, 0.05272674560546875, 0.05768394470214844, 0.06264114379882812, 0.06759834289550781, 0.0725555419921875, 0.07751274108886719, 0.08246994018554688, 0.08742713928222656, 0.09238433837890625, 0.09734153747558594, 0.10229873657226562, 0.10725593566894531, 0.112213134765625, 0.11717033386230469, 0.12212753295898438, 0.12708473205566406, 0.13204193115234375, 0.13699913024902344, 0.14195632934570312, 0.1469135284423828, 0.1518707275390625, 0.1568279266357422, 0.16178512573242188, 0.16674232482910156, 0.17169952392578125, 0.17665672302246094, 0.18161392211914062, 0.1865711212158203, 0.1915283203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 3.0, 12.0, 5.0, 9.0, 17.0, 19.0, 43.0, 40.0, 53.0, 100.0, 106.0, 224.0, 348.0, 557.0, 1124.0, 2504.0, 6108.0, 17899.0, 67399.0, 316621.0, 484074.0, 109158.0, 27030.0, 8498.0, 3297.0, 1475.0, 681.0, 385.0, 237.0, 154.0, 100.0, 72.0, 53.0, 28.0, 27.0, 24.0, 22.0, 13.0, 9.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.264892578125, -0.2566566467285156, -0.24842071533203125, -0.24018478393554688, -0.2319488525390625, -0.22371292114257812, -0.21547698974609375, -0.20724105834960938, -0.199005126953125, -0.19076919555664062, -0.18253326416015625, -0.17429733276367188, -0.1660614013671875, -0.15782546997070312, -0.14958953857421875, -0.14135360717773438, -0.13311767578125, -0.12488174438476562, -0.11664581298828125, -0.10840988159179688, -0.1001739501953125, -0.09193801879882812, -0.08370208740234375, -0.07546615600585938, -0.067230224609375, -0.058994293212890625, -0.05075836181640625, -0.042522430419921875, -0.0342864990234375, -0.026050567626953125, -0.01781463623046875, -0.009578704833984375, -0.0013427734375, 0.006893157958984375, 0.01512908935546875, 0.023365020751953125, 0.0316009521484375, 0.039836883544921875, 0.04807281494140625, 0.056308746337890625, 0.064544677734375, 0.07278060913085938, 0.08101654052734375, 0.08925247192382812, 0.0974884033203125, 0.10572433471679688, 0.11396026611328125, 0.12219619750976562, 0.13043212890625, 0.13866806030273438, 0.14690399169921875, 0.15513992309570312, 0.1633758544921875, 0.17161178588867188, 0.17984771728515625, 0.18808364868164062, 0.196319580078125, 0.20455551147460938, 0.21279144287109375, 0.22102737426757812, 0.2292633056640625, 0.23749923706054688, 0.24573516845703125, 0.2539710998535156, 0.26220703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 7.0, 1.0, 4.0, 8.0, 9.0, 8.0, 15.0, 10.0, 20.0, 20.0, 16.0, 27.0, 38.0, 35.0, 40.0, 38.0, 43.0, 35.0, 46.0, 38.0, 45.0, 58.0, 42.0, 49.0, 39.0, 32.0, 27.0, 40.0, 30.0, 38.0, 22.0, 22.0, 10.0, 18.0, 10.0, 10.0, 11.0, 11.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.362548828125, -0.35205078125, -0.341552734375, -0.3310546875, -0.320556640625, -0.31005859375, -0.299560546875, -0.2890625, -0.278564453125, -0.26806640625, -0.257568359375, -0.2470703125, -0.236572265625, -0.22607421875, -0.215576171875, -0.205078125, -0.194580078125, -0.18408203125, -0.173583984375, -0.1630859375, -0.152587890625, -0.14208984375, -0.131591796875, -0.12109375, -0.110595703125, -0.10009765625, -0.089599609375, -0.0791015625, -0.068603515625, -0.05810546875, -0.047607421875, -0.037109375, -0.026611328125, -0.01611328125, -0.005615234375, 0.0048828125, 0.015380859375, 0.02587890625, 0.036376953125, 0.046875, 0.057373046875, 0.06787109375, 0.078369140625, 0.0888671875, 0.099365234375, 0.10986328125, 0.120361328125, 0.130859375, 0.141357421875, 0.15185546875, 0.162353515625, 0.1728515625, 0.183349609375, 0.19384765625, 0.204345703125, 0.21484375, 0.225341796875, 0.23583984375, 0.246337890625, 0.2568359375, 0.267333984375, 0.27783203125, 0.288330078125, 0.298828125, 0.309326171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 17.0, 22.0, 40.0, 74.0, 140.0, 265.0, 651.0, 2247.0, 13589.0, 143328.0, 815074.0, 63788.0, 6966.0, 1401.0, 456.0, 214.0, 110.0, 58.0, 34.0, 12.0, 13.0, 9.0, 9.0, 10.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.1410083770751953, -0.13650894165039062, -0.13200950622558594, -0.12751007080078125, -0.12301063537597656, -0.11851119995117188, -0.11401176452636719, -0.1095123291015625, -0.10501289367675781, -0.10051345825195312, -0.09601402282714844, -0.09151458740234375, -0.08701515197753906, -0.08251571655273438, -0.07801628112792969, -0.073516845703125, -0.06901741027832031, -0.06451797485351562, -0.06001853942871094, -0.05551910400390625, -0.05101966857910156, -0.046520233154296875, -0.04202079772949219, -0.0375213623046875, -0.03302192687988281, -0.028522491455078125, -0.024023056030273438, -0.01952362060546875, -0.015024185180664062, -0.010524749755859375, -0.0060253143310546875, -0.00152587890625, 0.0029735565185546875, 0.007472991943359375, 0.011972427368164062, 0.01647186279296875, 0.020971298217773438, 0.025470733642578125, 0.029970169067382812, 0.0344696044921875, 0.03896903991699219, 0.043468475341796875, 0.04796791076660156, 0.05246734619140625, 0.05696678161621094, 0.061466217041015625, 0.06596565246582031, 0.070465087890625, 0.07496452331542969, 0.07946395874023438, 0.08396339416503906, 0.08846282958984375, 0.09296226501464844, 0.09746170043945312, 0.10196113586425781, 0.1064605712890625, 0.11096000671386719, 0.11545944213867188, 0.11995887756347656, 0.12445831298828125, 0.12895774841308594, 0.13345718383789062, 0.1379566192626953, 0.1424560546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 5.0, 6.0, 7.0, 12.0, 15.0, 10.0, 12.0, 14.0, 23.0, 26.0, 33.0, 62.0, 74.0, 89.0, 112.0, 99.0, 112.0, 69.0, 39.0, 36.0, 37.0, 10.0, 22.0, 11.0, 7.0, 12.0, 10.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.807222962379456e-05, -6.545335054397583e-05, -6.28344714641571e-05, -6.021559238433838e-05, -5.759671330451965e-05, -5.497783422470093e-05, -5.23589551448822e-05, -4.9740076065063477e-05, -4.712119698524475e-05, -4.4502317905426025e-05, -4.18834388256073e-05, -3.9264559745788574e-05, -3.664568066596985e-05, -3.402680158615112e-05, -3.14079225063324e-05, -2.8789043426513672e-05, -2.6170164346694946e-05, -2.355128526687622e-05, -2.0932406187057495e-05, -1.831352710723877e-05, -1.5694648027420044e-05, -1.3075768947601318e-05, -1.0456889867782593e-05, -7.838010787963867e-06, -5.219131708145142e-06, -2.600252628326416e-06, 1.862645149230957e-08, 2.637505531311035e-06, 5.256384611129761e-06, 7.875263690948486e-06, 1.0494142770767212e-05, 1.3113021850585938e-05, 1.5731900930404663e-05, 1.835078001022339e-05, 2.0969659090042114e-05, 2.358853816986084e-05, 2.6207417249679565e-05, 2.882629632949829e-05, 3.1445175409317017e-05, 3.406405448913574e-05, 3.668293356895447e-05, 3.930181264877319e-05, 4.192069172859192e-05, 4.4539570808410645e-05, 4.715844988822937e-05, 4.9777328968048096e-05, 5.239620804786682e-05, 5.501508712768555e-05, 5.763396620750427e-05, 6.0252845287323e-05, 6.287172436714172e-05, 6.549060344696045e-05, 6.810948252677917e-05, 7.07283616065979e-05, 7.334724068641663e-05, 7.596611976623535e-05, 7.858499884605408e-05, 8.12038779258728e-05, 8.382275700569153e-05, 8.644163608551025e-05, 8.906051516532898e-05, 9.16793942451477e-05, 9.429827332496643e-05, 9.691715240478516e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 7.0, 8.0, 12.0, 23.0, 34.0, 47.0, 85.0, 142.0, 228.0, 373.0, 792.0, 2424.0, 12623.0, 89913.0, 781210.0, 137081.0, 18314.0, 3200.0, 955.0, 463.0, 223.0, 161.0, 78.0, 57.0, 32.0, 21.0, 13.0, 7.0, 8.0, 3.0, 4.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.11088275909423828, -0.10671424865722656, -0.10254573822021484, -0.09837722778320312, -0.0942087173461914, -0.09004020690917969, -0.08587169647216797, -0.08170318603515625, -0.07753467559814453, -0.07336616516113281, -0.0691976547241211, -0.06502914428710938, -0.060860633850097656, -0.05669212341308594, -0.05252361297607422, -0.0483551025390625, -0.04418659210205078, -0.04001808166503906, -0.035849571228027344, -0.031681060791015625, -0.027512550354003906, -0.023344039916992188, -0.01917552947998047, -0.01500701904296875, -0.010838508605957031, -0.0066699981689453125, -0.0025014877319335938, 0.001667022705078125, 0.005835533142089844, 0.010004043579101562, 0.014172554016113281, 0.018341064453125, 0.02250957489013672, 0.026678085327148438, 0.030846595764160156, 0.035015106201171875, 0.039183616638183594, 0.04335212707519531, 0.04752063751220703, 0.05168914794921875, 0.05585765838623047, 0.06002616882324219, 0.0641946792602539, 0.06836318969726562, 0.07253170013427734, 0.07670021057128906, 0.08086872100830078, 0.0850372314453125, 0.08920574188232422, 0.09337425231933594, 0.09754276275634766, 0.10171127319335938, 0.1058797836303711, 0.11004829406738281, 0.11421680450439453, 0.11838531494140625, 0.12255382537841797, 0.1267223358154297, 0.1308908462524414, 0.13505935668945312, 0.13922786712646484, 0.14339637756347656, 0.14756488800048828, 0.1517333984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 13.0, 14.0, 11.0, 19.0, 28.0, 37.0, 33.0, 59.0, 75.0, 122.0, 167.0, 148.0, 84.0, 48.0, 41.0, 32.0, 24.0, 17.0, 4.0, 10.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1395263671875, -0.1362628936767578, -0.13299942016601562, -0.12973594665527344, -0.12647247314453125, -0.12320899963378906, -0.11994552612304688, -0.11668205261230469, -0.1134185791015625, -0.11015510559082031, -0.10689163208007812, -0.10362815856933594, -0.10036468505859375, -0.09710121154785156, -0.09383773803710938, -0.09057426452636719, -0.087310791015625, -0.08404731750488281, -0.08078384399414062, -0.07752037048339844, -0.07425689697265625, -0.07099342346191406, -0.06772994995117188, -0.06446647644042969, -0.0612030029296875, -0.05793952941894531, -0.054676055908203125, -0.05141258239746094, -0.04814910888671875, -0.04488563537597656, -0.041622161865234375, -0.03835868835449219, -0.03509521484375, -0.03183174133300781, -0.028568267822265625, -0.025304794311523438, -0.02204132080078125, -0.018777847290039062, -0.015514373779296875, -0.012250900268554688, -0.0089874267578125, -0.0057239532470703125, -0.002460479736328125, 0.0008029937744140625, 0.00406646728515625, 0.0073299407958984375, 0.010593414306640625, 0.013856887817382812, 0.017120361328125, 0.020383834838867188, 0.023647308349609375, 0.026910781860351562, 0.03017425537109375, 0.03343772888183594, 0.036701202392578125, 0.03996467590332031, 0.0432281494140625, 0.04649162292480469, 0.049755096435546875, 0.05301856994628906, 0.05628204345703125, 0.05954551696777344, 0.06280899047851562, 0.06607246398925781, 0.0693359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 44.0, 143.0, 369.0, 310.0, 99.0, 21.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6809935569763184, -3.5433645248413086, -3.405735731124878, -3.2681069374084473, -3.1304779052734375, -2.9928488731384277, -2.855220079421997, -2.7175912857055664, -2.5799622535705566, -2.442333221435547, -2.304704427719116, -2.1670756340026855, -2.029446601867676, -1.8918176889419556, -1.7541887760162354, -1.6165598630905151, -1.478930950164795, -1.3413020372390747, -1.2036731243133545, -1.0660442113876343, -0.9284152984619141, -0.7907863855361938, -0.6531574726104736, -0.5155285596847534, -0.3778996467590332, -0.240270733833313, -0.10264182090759277, 0.03498709201812744, 0.17261600494384766, 0.31024491786956787, 0.4478738307952881, 0.5855027437210083, 0.7231311798095703, 0.8607600927352905, 0.9983890056610107, 1.136017918586731, 1.2736468315124512, 1.4112757444381714, 1.5489046573638916, 1.6865335702896118, 1.824162483215332, 1.9617913961410522, 2.0994203090667725, 2.237049102783203, 2.374678134918213, 2.5123071670532227, 2.6499359607696533, 2.787564754486084, 2.9251937866210938, 3.0628228187561035, 3.200451612472534, 3.338080406188965, 3.4757094383239746, 3.6133384704589844, 3.750967264175415, 3.8885960578918457, 4.0262250900268555, 4.163854122161865, 4.301483154296875, 4.439111709594727, 4.576740741729736, 4.714369773864746, 4.851998329162598, 4.989627361297607, 5.127256393432617]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 0.0, 8.0, 10.0, 14.0, 15.0, 8.0, 16.0, 14.0, 17.0, 18.0, 26.0, 34.0, 28.0, 29.0, 33.0, 39.0, 41.0, 29.0, 46.0, 47.0, 33.0, 32.0, 53.0, 36.0, 43.0, 39.0, 38.0, 27.0, 33.0, 26.0, 23.0, 17.0, 28.0, 19.0, 17.0, 12.0, 11.0, 7.0, 4.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3635234832763672, -1.3164212703704834, -1.26931893825531, -1.2222166061401367, -1.175114393234253, -1.1280121803283691, -1.0809098482131958, -1.0338075160980225, -0.9867053031921387, -0.9396030306816101, -0.8925007581710815, -0.845398485660553, -0.7982962131500244, -0.7511939406394958, -0.7040916681289673, -0.6569893956184387, -0.6098871231079102, -0.5627848505973816, -0.515682578086853, -0.46858030557632446, -0.4214780330657959, -0.37437576055526733, -0.32727348804473877, -0.2801712155342102, -0.23306894302368164, -0.18596667051315308, -0.1388643980026245, -0.09176212549209595, -0.04465985298156738, 0.0024424195289611816, 0.049544692039489746, 0.09664696455001831, 0.14374923706054688, 0.19085150957107544, 0.237953782081604, 0.28505605459213257, 0.33215832710266113, 0.3792605996131897, 0.42636287212371826, 0.4734651446342468, 0.5205674171447754, 0.567669689655304, 0.6147719621658325, 0.6618742346763611, 0.7089765071868896, 0.7560787796974182, 0.8031810522079468, 0.8502833247184753, 0.8973855972290039, 0.9444878697395325, 0.991590142250061, 1.0386924743652344, 1.0857946872711182, 1.132896900177002, 1.1799992322921753, 1.2271015644073486, 1.2742037773132324, 1.3213059902191162, 1.3684083223342896, 1.415510654449463, 1.4626128673553467, 1.5097150802612305, 1.5568174123764038, 1.6039197444915771, 1.651021957397461]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 9.0, 11.0, 18.0, 15.0, 24.0, 37.0, 64.0, 100.0, 146.0, 211.0, 372.0, 668.0, 1313.0, 2902.0, 7368.0, 28182.0, 323720.0, 3737338.0, 70011.0, 13447.0, 4446.0, 1812.0, 869.0, 475.0, 247.0, 132.0, 99.0, 73.0, 41.0, 24.0, 22.0, 18.0, 7.0, 20.0, 6.0, 4.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.315673828125, -0.30449676513671875, -0.2933197021484375, -0.28214263916015625, -0.270965576171875, -0.25978851318359375, -0.2486114501953125, -0.23743438720703125, -0.22625732421875, -0.21508026123046875, -0.2039031982421875, -0.19272613525390625, -0.181549072265625, -0.17037200927734375, -0.1591949462890625, -0.14801788330078125, -0.1368408203125, -0.12566375732421875, -0.1144866943359375, -0.10330963134765625, -0.092132568359375, -0.08095550537109375, -0.0697784423828125, -0.05860137939453125, -0.04742431640625, -0.03624725341796875, -0.0250701904296875, -0.01389312744140625, -0.002716064453125, 0.00846099853515625, 0.0196380615234375, 0.03081512451171875, 0.0419921875, 0.05316925048828125, 0.0643463134765625, 0.07552337646484375, 0.086700439453125, 0.09787750244140625, 0.1090545654296875, 0.12023162841796875, 0.13140869140625, 0.14258575439453125, 0.1537628173828125, 0.16493988037109375, 0.176116943359375, 0.18729400634765625, 0.1984710693359375, 0.20964813232421875, 0.2208251953125, 0.23200225830078125, 0.2431793212890625, 0.25435638427734375, 0.265533447265625, 0.27671051025390625, 0.2878875732421875, 0.29906463623046875, 0.31024169921875, 0.32141876220703125, 0.3325958251953125, 0.34377288818359375, 0.354949951171875, 0.36612701416015625, 0.3773040771484375, 0.38848114013671875, 0.399658203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 2.0, 13.0, 8.0, 15.0, 32.0, 41.0, 64.0, 74.0, 102.0, 81.0, 127.0, 99.0, 88.0, 76.0, 50.0, 37.0, 29.0, 23.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1435546875, -0.1379108428955078, -0.13226699829101562, -0.12662315368652344, -0.12097930908203125, -0.11533546447753906, -0.10969161987304688, -0.10404777526855469, -0.0984039306640625, -0.09276008605957031, -0.08711624145507812, -0.08147239685058594, -0.07582855224609375, -0.07018470764160156, -0.06454086303710938, -0.05889701843261719, -0.053253173828125, -0.04760932922363281, -0.041965484619140625, -0.03632164001464844, -0.03067779541015625, -0.025033950805664062, -0.019390106201171875, -0.013746261596679688, -0.0081024169921875, -0.0024585723876953125, 0.003185272216796875, 0.008829116821289062, 0.01447296142578125, 0.020116806030273438, 0.025760650634765625, 0.03140449523925781, 0.03704833984375, 0.04269218444824219, 0.048336029052734375, 0.05397987365722656, 0.05962371826171875, 0.06526756286621094, 0.07091140747070312, 0.07655525207519531, 0.0821990966796875, 0.08784294128417969, 0.09348678588867188, 0.09913063049316406, 0.10477447509765625, 0.11041831970214844, 0.11606216430664062, 0.12170600891113281, 0.127349853515625, 0.1329936981201172, 0.13863754272460938, 0.14428138732910156, 0.14992523193359375, 0.15556907653808594, 0.16121292114257812, 0.1668567657470703, 0.1725006103515625, 0.1781444549560547, 0.18378829956054688, 0.18943214416503906, 0.19507598876953125, 0.20071983337402344, 0.20636367797851562, 0.2120075225830078, 0.2176513671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 12.0, 13.0, 23.0, 46.0, 77.0, 77.0, 129.0, 209.0, 353.0, 524.0, 928.0, 1604.0, 3030.0, 6791.0, 19666.0, 88169.0, 2359282.0, 1602550.0, 79159.0, 18520.0, 6589.0, 2831.0, 1477.0, 839.0, 491.0, 311.0, 205.0, 141.0, 81.0, 49.0, 29.0, 22.0, 20.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.2249469757080078, -0.21869277954101562, -0.21243858337402344, -0.20618438720703125, -0.19993019104003906, -0.19367599487304688, -0.1874217987060547, -0.1811676025390625, -0.1749134063720703, -0.16865921020507812, -0.16240501403808594, -0.15615081787109375, -0.14989662170410156, -0.14364242553710938, -0.1373882293701172, -0.131134033203125, -0.12487983703613281, -0.11862564086914062, -0.11237144470214844, -0.10611724853515625, -0.09986305236816406, -0.09360885620117188, -0.08735466003417969, -0.0811004638671875, -0.07484626770019531, -0.06859207153320312, -0.06233787536621094, -0.05608367919921875, -0.04982948303222656, -0.043575286865234375, -0.03732109069824219, -0.03106689453125, -0.024812698364257812, -0.018558502197265625, -0.012304306030273438, -0.00605010986328125, 0.0002040863037109375, 0.006458282470703125, 0.012712478637695312, 0.0189666748046875, 0.025220870971679688, 0.031475067138671875, 0.03772926330566406, 0.04398345947265625, 0.05023765563964844, 0.056491851806640625, 0.06274604797363281, 0.069000244140625, 0.07525444030761719, 0.08150863647460938, 0.08776283264160156, 0.09401702880859375, 0.10027122497558594, 0.10652542114257812, 0.11277961730957031, 0.1190338134765625, 0.1252880096435547, 0.13154220581054688, 0.13779640197753906, 0.14405059814453125, 0.15030479431152344, 0.15655899047851562, 0.1628131866455078, 0.1690673828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 6.0, 1.0, 6.0, 3.0, 10.0, 12.0, 20.0, 25.0, 52.0, 86.0, 249.0, 711.0, 1926.0, 551.0, 184.0, 82.0, 43.0, 33.0, 21.0, 13.0, 7.0, 13.0, 4.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11767578125, -0.11425304412841797, -0.11083030700683594, -0.1074075698852539, -0.10398483276367188, -0.10056209564208984, -0.09713935852050781, -0.09371662139892578, -0.09029388427734375, -0.08687114715576172, -0.08344841003417969, -0.08002567291259766, -0.07660293579101562, -0.0731801986694336, -0.06975746154785156, -0.06633472442626953, -0.0629119873046875, -0.05948925018310547, -0.05606651306152344, -0.052643775939941406, -0.049221038818359375, -0.045798301696777344, -0.04237556457519531, -0.03895282745361328, -0.03553009033203125, -0.03210735321044922, -0.028684616088867188, -0.025261878967285156, -0.021839141845703125, -0.018416404724121094, -0.014993667602539062, -0.011570930480957031, -0.008148193359375, -0.004725456237792969, -0.0013027191162109375, 0.0021200180053710938, 0.005542755126953125, 0.008965492248535156, 0.012388229370117188, 0.01581096649169922, 0.01923370361328125, 0.02265644073486328, 0.026079177856445312, 0.029501914978027344, 0.032924652099609375, 0.036347389221191406, 0.03977012634277344, 0.04319286346435547, 0.0466156005859375, 0.05003833770751953, 0.05346107482910156, 0.056883811950683594, 0.060306549072265625, 0.06372928619384766, 0.06715202331542969, 0.07057476043701172, 0.07399749755859375, 0.07742023468017578, 0.08084297180175781, 0.08426570892333984, 0.08768844604492188, 0.0911111831665039, 0.09453392028808594, 0.09795665740966797, 0.10137939453125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 17.0, 37.0, 100.0, 155.0, 193.0, 189.0, 142.0, 78.0, 29.0, 19.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8660962581634521, -0.8459039330482483, -0.8257116079330444, -0.8055192828178406, -0.7853269577026367, -0.7651346325874329, -0.744942307472229, -0.7247500419616699, -0.7045576572418213, -0.6843653321266174, -0.6641730070114136, -0.6439806818962097, -0.6237883567810059, -0.603596031665802, -0.5834037065505981, -0.5632114410400391, -0.5430191159248352, -0.5228267908096313, -0.5026344656944275, -0.48244214057922363, -0.4622498154640198, -0.4420574903488159, -0.42186519503593445, -0.4016728699207306, -0.38148054480552673, -0.3612882196903229, -0.341095894575119, -0.32090356945991516, -0.3007112741470337, -0.28051894903182983, -0.260326623916626, -0.24013429880142212, -0.21994197368621826, -0.1997496485710144, -0.17955732345581055, -0.15936501324176788, -0.13917268812656403, -0.11898036301136017, -0.09878804534673691, -0.07859572768211365, -0.05840340256690979, -0.03821108117699623, -0.018018759787082672, 0.002173561602830887, 0.022365882992744446, 0.0425582081079483, 0.06275052577257156, 0.08294284343719482, 0.10313516855239868, 0.12332749366760254, 0.1435198187828064, 0.16371212899684906, 0.18390445411205292, 0.20409677922725677, 0.22428908944129944, 0.2444814145565033, 0.26467373967170715, 0.284866064786911, 0.30505838990211487, 0.3252507150173187, 0.3454430103302002, 0.36563533544540405, 0.3858276605606079, 0.40601998567581177, 0.4262123107910156]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 19.0, 17.0, 20.0, 19.0, 38.0, 33.0, 32.0, 34.0, 34.0, 46.0, 34.0, 54.0, 49.0, 56.0, 55.0, 44.0, 45.0, 41.0, 47.0, 40.0, 31.0, 24.0, 32.0, 26.0, 17.0, 26.0, 16.0, 9.0, 12.0, 5.0, 6.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36335307359695435, -0.3531562387943268, -0.3429594039916992, -0.33276256918907166, -0.3225657343864441, -0.3123689293861389, -0.30217209458351135, -0.2919752597808838, -0.2817784249782562, -0.27158159017562866, -0.2613847553730011, -0.25118792057037354, -0.24099110066890717, -0.2307942658662796, -0.22059744596481323, -0.21040061116218567, -0.2002037763595581, -0.19000694155693054, -0.17981010675430298, -0.1696132868528366, -0.15941645205020905, -0.14921961724758148, -0.1390227973461151, -0.12882596254348755, -0.11862912774085999, -0.10843229293823242, -0.09823546558618546, -0.08803863823413849, -0.07784180343151093, -0.06764496862888336, -0.057448141276836395, -0.04725131392478943, -0.037054479122161865, -0.0268576480448246, -0.016660816967487335, -0.00646398589015007, 0.003732845187187195, 0.01392967626452446, 0.024126507341861725, 0.03432333469390869, 0.044520169496536255, 0.05471700057387352, 0.06491383165121078, 0.07511065900325775, 0.08530749380588531, 0.09550432860851288, 0.10570115596055984, 0.11589798331260681, 0.12609481811523438, 0.13629165291786194, 0.1464884877204895, 0.15668530762195587, 0.16688214242458344, 0.177078977227211, 0.18727579712867737, 0.19747263193130493, 0.2076694667339325, 0.21786630153656006, 0.22806313633918762, 0.238259956240654, 0.24845679104328156, 0.2586536109447479, 0.2688504457473755, 0.27904728055000305, 0.2892441153526306]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 9.0, 3.0, 13.0, 19.0, 45.0, 95.0, 171.0, 323.0, 746.0, 2142.0, 9894.0, 111795.0, 828640.0, 83116.0, 8316.0, 1941.0, 643.0, 301.0, 156.0, 80.0, 41.0, 15.0, 14.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5455551147460938, -0.5256805419921875, -0.5058059692382812, -0.485931396484375, -0.46605682373046875, -0.4461822509765625, -0.42630767822265625, -0.40643310546875, -0.38655853271484375, -0.3666839599609375, -0.34680938720703125, -0.326934814453125, -0.30706024169921875, -0.2871856689453125, -0.26731109619140625, -0.2474365234375, -0.22756195068359375, -0.2076873779296875, -0.18781280517578125, -0.167938232421875, -0.14806365966796875, -0.1281890869140625, -0.10831451416015625, -0.08843994140625, -0.06856536865234375, -0.0486907958984375, -0.02881622314453125, -0.008941650390625, 0.01093292236328125, 0.0308074951171875, 0.05068206787109375, 0.070556640625, 0.09043121337890625, 0.1103057861328125, 0.13018035888671875, 0.150054931640625, 0.16992950439453125, 0.1898040771484375, 0.20967864990234375, 0.22955322265625, 0.24942779541015625, 0.2693023681640625, 0.28917694091796875, 0.309051513671875, 0.32892608642578125, 0.3488006591796875, 0.36867523193359375, 0.3885498046875, 0.40842437744140625, 0.4282989501953125, 0.44817352294921875, 0.468048095703125, 0.48792266845703125, 0.5077972412109375, 0.5276718139648438, 0.54754638671875, 0.5674209594726562, 0.5872955322265625, 0.6071701049804688, 0.627044677734375, 0.6469192504882812, 0.6667938232421875, 0.6866683959960938, 0.70654296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 11.0, 15.0, 18.0, 33.0, 37.0, 76.0, 78.0, 107.0, 85.0, 126.0, 111.0, 65.0, 75.0, 50.0, 36.0, 19.0, 20.0, 9.0, 9.0, 6.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1466064453125, -0.14100074768066406, -0.13539505004882812, -0.1297893524169922, -0.12418365478515625, -0.11857795715332031, -0.11297225952148438, -0.10736656188964844, -0.1017608642578125, -0.09615516662597656, -0.09054946899414062, -0.08494377136230469, -0.07933807373046875, -0.07373237609863281, -0.06812667846679688, -0.06252098083496094, -0.056915283203125, -0.05130958557128906, -0.045703887939453125, -0.04009819030761719, -0.03449249267578125, -0.028886795043945312, -0.023281097412109375, -0.017675399780273438, -0.0120697021484375, -0.0064640045166015625, -0.000858306884765625, 0.0047473907470703125, 0.01035308837890625, 0.015958786010742188, 0.021564483642578125, 0.027170181274414062, 0.03277587890625, 0.03838157653808594, 0.043987274169921875, 0.04959297180175781, 0.05519866943359375, 0.06080436706542969, 0.06641006469726562, 0.07201576232910156, 0.0776214599609375, 0.08322715759277344, 0.08883285522460938, 0.09443855285644531, 0.10004425048828125, 0.10564994812011719, 0.11125564575195312, 0.11686134338378906, 0.122467041015625, 0.12807273864746094, 0.13367843627929688, 0.1392841339111328, 0.14488983154296875, 0.1504955291748047, 0.15610122680664062, 0.16170692443847656, 0.1673126220703125, 0.17291831970214844, 0.17852401733398438, 0.1841297149658203, 0.18973541259765625, 0.1953411102294922, 0.20094680786132812, 0.20655250549316406, 0.212158203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 8.0, 9.0, 15.0, 28.0, 43.0, 46.0, 94.0, 134.0, 246.0, 456.0, 902.0, 2213.0, 7237.0, 29225.0, 170920.0, 646858.0, 152599.0, 26714.0, 6617.0, 2252.0, 868.0, 461.0, 270.0, 125.0, 66.0, 40.0, 43.0, 21.0, 13.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.251678466796875, -0.24139404296875, -0.231109619140625, -0.2208251953125, -0.210540771484375, -0.20025634765625, -0.189971923828125, -0.1796875, -0.169403076171875, -0.15911865234375, -0.148834228515625, -0.1385498046875, -0.128265380859375, -0.11798095703125, -0.107696533203125, -0.097412109375, -0.087127685546875, -0.07684326171875, -0.066558837890625, -0.0562744140625, -0.045989990234375, -0.03570556640625, -0.025421142578125, -0.01513671875, -0.004852294921875, 0.00543212890625, 0.015716552734375, 0.0260009765625, 0.036285400390625, 0.04656982421875, 0.056854248046875, 0.067138671875, 0.077423095703125, 0.08770751953125, 0.097991943359375, 0.1082763671875, 0.118560791015625, 0.12884521484375, 0.139129638671875, 0.1494140625, 0.159698486328125, 0.16998291015625, 0.180267333984375, 0.1905517578125, 0.200836181640625, 0.21112060546875, 0.221405029296875, 0.231689453125, 0.241973876953125, 0.25225830078125, 0.262542724609375, 0.2728271484375, 0.283111572265625, 0.29339599609375, 0.303680419921875, 0.31396484375, 0.324249267578125, 0.33453369140625, 0.344818115234375, 0.3551025390625, 0.365386962890625, 0.37567138671875, 0.385955810546875, 0.396240234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 9.0, 8.0, 17.0, 17.0, 23.0, 27.0, 42.0, 49.0, 50.0, 59.0, 65.0, 57.0, 73.0, 86.0, 59.0, 70.0, 50.0, 49.0, 48.0, 39.0, 26.0, 17.0, 17.0, 11.0, 7.0, 6.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4060401916503906, -0.39044952392578125, -0.3748588562011719, -0.3592681884765625, -0.3436775207519531, -0.32808685302734375, -0.3124961853027344, -0.296905517578125, -0.2813148498535156, -0.26572418212890625, -0.2501335144042969, -0.2345428466796875, -0.21895217895507812, -0.20336151123046875, -0.18777084350585938, -0.17218017578125, -0.15658950805664062, -0.14099884033203125, -0.12540817260742188, -0.1098175048828125, -0.09422683715820312, -0.07863616943359375, -0.06304550170898438, -0.047454833984375, -0.031864166259765625, -0.01627349853515625, -0.000682830810546875, 0.0149078369140625, 0.030498504638671875, 0.04608917236328125, 0.061679840087890625, 0.0772705078125, 0.09286117553710938, 0.10845184326171875, 0.12404251098632812, 0.1396331787109375, 0.15522384643554688, 0.17081451416015625, 0.18640518188476562, 0.201995849609375, 0.21758651733398438, 0.23317718505859375, 0.24876785278320312, 0.2643585205078125, 0.2799491882324219, 0.29553985595703125, 0.3111305236816406, 0.32672119140625, 0.3423118591308594, 0.35790252685546875, 0.3734931945800781, 0.3890838623046875, 0.4046745300292969, 0.42026519775390625, 0.4358558654785156, 0.451446533203125, 0.4670372009277344, 0.48262786865234375, 0.4982185363769531, 0.5138092041015625, 0.5293998718261719, 0.5449905395507812, 0.5605812072753906, 0.576171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 18.0, 46.0, 79.0, 206.0, 395.0, 1094.0, 3888.0, 19345.0, 141634.0, 783081.0, 81574.0, 12900.0, 2797.0, 782.0, 342.0, 163.0, 93.0, 40.0, 18.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.08997344970703125, -0.0865631103515625, -0.08315277099609375, -0.079742431640625, -0.07633209228515625, -0.0729217529296875, -0.06951141357421875, -0.06610107421875, -0.06269073486328125, -0.0592803955078125, -0.05587005615234375, -0.052459716796875, -0.04904937744140625, -0.0456390380859375, -0.04222869873046875, -0.038818359375, -0.03540802001953125, -0.0319976806640625, -0.02858734130859375, -0.025177001953125, -0.02176666259765625, -0.0183563232421875, -0.01494598388671875, -0.01153564453125, -0.00812530517578125, -0.0047149658203125, -0.00130462646484375, 0.002105712890625, 0.00551605224609375, 0.0089263916015625, 0.01233673095703125, 0.0157470703125, 0.01915740966796875, 0.0225677490234375, 0.02597808837890625, 0.029388427734375, 0.03279876708984375, 0.0362091064453125, 0.03961944580078125, 0.04302978515625, 0.04644012451171875, 0.0498504638671875, 0.05326080322265625, 0.056671142578125, 0.06008148193359375, 0.0634918212890625, 0.06690216064453125, 0.0703125, 0.07372283935546875, 0.0771331787109375, 0.08054351806640625, 0.083953857421875, 0.08736419677734375, 0.0907745361328125, 0.09418487548828125, 0.09759521484375, 0.10100555419921875, 0.1044158935546875, 0.10782623291015625, 0.111236572265625, 0.11464691162109375, 0.1180572509765625, 0.12146759033203125, 0.1248779296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 5.0, 7.0, 7.0, 18.0, 25.0, 31.0, 44.0, 85.0, 146.0, 159.0, 160.0, 116.0, 65.0, 52.0, 27.0, 21.0, 15.0, 11.0, 6.0, 3.0, 0.0, 2.0], "bins": [-0.00022041797637939453, -0.00021615158766508102, -0.00021188519895076752, -0.000207618810236454, -0.0002033524215221405, -0.000199086032807827, -0.0001948196440935135, -0.00019055325537919998, -0.00018628686666488647, -0.00018202047795057297, -0.00017775408923625946, -0.00017348770052194595, -0.00016922131180763245, -0.00016495492309331894, -0.00016068853437900543, -0.00015642214566469193, -0.00015215575695037842, -0.0001478893682360649, -0.0001436229795217514, -0.0001393565908074379, -0.0001350902020931244, -0.00013082381337881088, -0.00012655742466449738, -0.00012229103595018387, -0.00011802464723587036, -0.00011375825852155685, -0.00010949186980724335, -0.00010522548109292984, -0.00010095909237861633, -9.669270366430283e-05, -9.242631494998932e-05, -8.815992623567581e-05, -8.38935375213623e-05, -7.96271488070488e-05, -7.536076009273529e-05, -7.109437137842178e-05, -6.682798266410828e-05, -6.256159394979477e-05, -5.829520523548126e-05, -5.4028816521167755e-05, -4.976242780685425e-05, -4.549603909254074e-05, -4.1229650378227234e-05, -3.696326166391373e-05, -3.269687294960022e-05, -2.8430484235286713e-05, -2.4164095520973206e-05, -1.98977068066597e-05, -1.563131809234619e-05, -1.1364929378032684e-05, -7.098540663719177e-06, -2.83215194940567e-06, 1.434236764907837e-06, 5.700625479221344e-06, 9.967014193534851e-06, 1.4233402907848358e-05, 1.8499791622161865e-05, 2.2766180336475372e-05, 2.703256905078888e-05, 3.1298957765102386e-05, 3.5565346479415894e-05, 3.98317351937294e-05, 4.409812390804291e-05, 4.8364512622356415e-05, 5.263090133666992e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 7.0, 15.0, 29.0, 40.0, 37.0, 71.0, 141.0, 228.0, 411.0, 927.0, 1929.0, 4934.0, 14739.0, 51005.0, 309238.0, 552162.0, 79421.0, 21338.0, 6967.0, 2581.0, 1089.0, 547.0, 271.0, 130.0, 103.0, 66.0, 35.0, 36.0, 17.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0762939453125, -0.07384490966796875, -0.0713958740234375, -0.06894683837890625, -0.066497802734375, -0.06404876708984375, -0.0615997314453125, -0.05915069580078125, -0.05670166015625, -0.05425262451171875, -0.0518035888671875, -0.04935455322265625, -0.046905517578125, -0.04445648193359375, -0.0420074462890625, -0.03955841064453125, -0.037109375, -0.03466033935546875, -0.0322113037109375, -0.02976226806640625, -0.027313232421875, -0.02486419677734375, -0.0224151611328125, -0.01996612548828125, -0.01751708984375, -0.01506805419921875, -0.0126190185546875, -0.01016998291015625, -0.007720947265625, -0.00527191162109375, -0.0028228759765625, -0.00037384033203125, 0.0020751953125, 0.00452423095703125, 0.0069732666015625, 0.00942230224609375, 0.011871337890625, 0.01432037353515625, 0.0167694091796875, 0.01921844482421875, 0.02166748046875, 0.02411651611328125, 0.0265655517578125, 0.02901458740234375, 0.031463623046875, 0.03391265869140625, 0.0363616943359375, 0.03881072998046875, 0.041259765625, 0.04370880126953125, 0.0461578369140625, 0.04860687255859375, 0.051055908203125, 0.05350494384765625, 0.0559539794921875, 0.05840301513671875, 0.06085205078125, 0.06330108642578125, 0.0657501220703125, 0.06819915771484375, 0.070648193359375, 0.07309722900390625, 0.0755462646484375, 0.07799530029296875, 0.0804443359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 9.0, 12.0, 10.0, 17.0, 26.0, 23.0, 52.0, 62.0, 80.0, 84.0, 108.0, 102.0, 89.0, 71.0, 57.0, 47.0, 25.0, 21.0, 25.0, 15.0, 10.0, 13.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07586669921875, -0.07362937927246094, -0.07139205932617188, -0.06915473937988281, -0.06691741943359375, -0.06468009948730469, -0.062442779541015625, -0.06020545959472656, -0.0579681396484375, -0.05573081970214844, -0.053493499755859375, -0.05125617980957031, -0.04901885986328125, -0.04678153991699219, -0.044544219970703125, -0.04230690002441406, -0.040069580078125, -0.03783226013183594, -0.035594940185546875, -0.03335762023925781, -0.03112030029296875, -0.028882980346679688, -0.026645660400390625, -0.024408340454101562, -0.0221710205078125, -0.019933700561523438, -0.017696380615234375, -0.015459060668945312, -0.01322174072265625, -0.010984420776367188, -0.008747100830078125, -0.0065097808837890625, -0.0042724609375, -0.0020351409912109375, 0.000202178955078125, 0.0024394989013671875, 0.00467681884765625, 0.0069141387939453125, 0.009151458740234375, 0.011388778686523438, 0.0136260986328125, 0.015863418579101562, 0.018100738525390625, 0.020338058471679688, 0.02257537841796875, 0.024812698364257812, 0.027050018310546875, 0.029287338256835938, 0.031524658203125, 0.03376197814941406, 0.035999298095703125, 0.03823661804199219, 0.04047393798828125, 0.04271125793457031, 0.044948577880859375, 0.04718589782714844, 0.0494232177734375, 0.05166053771972656, 0.053897857666015625, 0.05613517761230469, 0.05837249755859375, 0.06060981750488281, 0.06284713745117188, 0.06508445739746094, 0.06732177734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 20.0, 54.0, 149.0, 318.0, 287.0, 129.0, 38.0, 8.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.373222827911377, -4.260837078094482, -4.14845085144043, -4.036065101623535, -3.9236793518066406, -3.811293363571167, -3.6989073753356934, -3.586521625518799, -3.4741358757019043, -3.3617498874664307, -3.249364137649536, -3.1369781494140625, -3.024592399597168, -2.9122064113616943, -2.7998204231262207, -2.687434673309326, -2.5750486850738525, -2.462662696838379, -2.3502769470214844, -2.2378909587860107, -2.125505208969116, -2.0131192207336426, -1.9007333517074585, -1.7883474826812744, -1.6759616136550903, -1.5635757446289062, -1.4511898756027222, -1.338804006576538, -1.2264180183410645, -1.11403226852417, -1.0016462802886963, -0.8892604112625122, -0.7768745422363281, -0.664488673210144, -0.55210280418396, -0.4397168755531311, -0.327331006526947, -0.21494513750076294, -0.10255920886993408, 0.00982666015625, 0.12221252918243408, 0.23459841310977936, 0.34698429703712463, 0.4593701958656311, 0.5717560648918152, 0.6841419339179993, 0.7965278625488281, 0.9089137315750122, 1.0212996006011963, 1.1336854696273804, 1.2460713386535645, 1.358457326889038, 1.4708430767059326, 1.5832290649414062, 1.6956149339675903, 1.8080008029937744, 1.9203866720199585, 2.0327725410461426, 2.145158529281616, 2.2575442790985107, 2.3699302673339844, 2.482316017150879, 2.5947020053863525, 2.707087993621826, 2.8194737434387207]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 1.0, 12.0, 4.0, 10.0, 8.0, 8.0, 14.0, 15.0, 18.0, 21.0, 27.0, 36.0, 23.0, 30.0, 26.0, 38.0, 45.0, 33.0, 50.0, 44.0, 45.0, 44.0, 50.0, 45.0, 40.0, 40.0, 42.0, 40.0, 25.0, 18.0, 24.0, 19.0, 15.0, 19.0, 11.0, 9.0, 13.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3927788734436035, -1.3483463525772095, -1.3039138317108154, -1.2594811916351318, -1.2150486707687378, -1.1706161499023438, -1.1261836290359497, -1.0817511081695557, -1.037318468093872, -0.992885947227478, -0.9484533667564392, -0.9040208458900452, -0.8595882654190063, -0.8151557445526123, -0.7707232236862183, -0.7262907028198242, -0.6818581819534302, -0.6374256610870361, -0.5929930806159973, -0.5485605597496033, -0.5041279792785645, -0.4596954584121704, -0.41526293754577637, -0.37083038687705994, -0.3263978362083435, -0.2819652855396271, -0.23753274977207184, -0.1931002140045166, -0.14866766333580017, -0.10423511266708374, -0.0598025918006897, -0.015370041131973267, 0.029062509536743164, 0.073495052754879, 0.11792759597301483, 0.16236013174057007, 0.2067926824092865, 0.25122523307800293, 0.295657753944397, 0.3400903046131134, 0.38452285528182983, 0.42895540595054626, 0.4733879566192627, 0.5178204774856567, 0.5622529983520508, 0.6066855788230896, 0.6511180996894836, 0.6955506801605225, 0.7399832010269165, 0.7844157218933105, 0.8288483023643494, 0.8732808232307434, 0.9177134037017822, 0.9621459245681763, 1.0065784454345703, 1.0510109663009644, 1.0954434871673584, 1.1398760080337524, 1.1843085289001465, 1.22874116897583, 1.2731736898422241, 1.3176062107086182, 1.3620387315750122, 1.4064712524414062, 1.4509038925170898]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 10.0, 8.0, 14.0, 7.0, 13.0, 22.0, 26.0, 65.0, 98.0, 166.0, 343.0, 592.0, 1334.0, 3523.0, 14892.0, 200875.0, 3921950.0, 39910.0, 6636.0, 2021.0, 808.0, 378.0, 221.0, 142.0, 77.0, 51.0, 29.0, 22.0, 13.0, 7.0, 6.0, 5.0, 10.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.61767578125, -0.5990982055664062, -0.5805206298828125, -0.5619430541992188, -0.543365478515625, -0.5247879028320312, -0.5062103271484375, -0.48763275146484375, -0.46905517578125, -0.45047760009765625, -0.4319000244140625, -0.41332244873046875, -0.394744873046875, -0.37616729736328125, -0.3575897216796875, -0.33901214599609375, -0.3204345703125, -0.30185699462890625, -0.2832794189453125, -0.26470184326171875, -0.246124267578125, -0.22754669189453125, -0.2089691162109375, -0.19039154052734375, -0.17181396484375, -0.15323638916015625, -0.1346588134765625, -0.11608123779296875, -0.097503662109375, -0.07892608642578125, -0.0603485107421875, -0.04177093505859375, -0.023193359375, -0.00461578369140625, 0.0139617919921875, 0.03253936767578125, 0.051116943359375, 0.06969451904296875, 0.0882720947265625, 0.10684967041015625, 0.12542724609375, 0.14400482177734375, 0.1625823974609375, 0.18115997314453125, 0.199737548828125, 0.21831512451171875, 0.2368927001953125, 0.25547027587890625, 0.2740478515625, 0.29262542724609375, 0.3112030029296875, 0.32978057861328125, 0.348358154296875, 0.36693572998046875, 0.3855133056640625, 0.40409088134765625, 0.42266845703125, 0.44124603271484375, 0.4598236083984375, 0.47840118408203125, 0.496978759765625, 0.5155563354492188, 0.5341339111328125, 0.5527114868164062, 0.5712890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 11.0, 10.0, 22.0, 37.0, 44.0, 72.0, 90.0, 97.0, 96.0, 119.0, 91.0, 77.0, 66.0, 46.0, 33.0, 25.0, 12.0, 10.0, 14.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13582229614257812, -0.13016510009765625, -0.12450790405273438, -0.1188507080078125, -0.11319351196289062, -0.10753631591796875, -0.10187911987304688, -0.096221923828125, -0.09056472778320312, -0.08490753173828125, -0.07925033569335938, -0.0735931396484375, -0.06793594360351562, -0.06227874755859375, -0.056621551513671875, -0.05096435546875, -0.045307159423828125, -0.03964996337890625, -0.033992767333984375, -0.0283355712890625, -0.022678375244140625, -0.01702117919921875, -0.011363983154296875, -0.005706787109375, -4.9591064453125e-05, 0.00560760498046875, 0.011264801025390625, 0.0169219970703125, 0.022579193115234375, 0.02823638916015625, 0.033893585205078125, 0.03955078125, 0.045207977294921875, 0.05086517333984375, 0.056522369384765625, 0.0621795654296875, 0.06783676147460938, 0.07349395751953125, 0.07915115356445312, 0.084808349609375, 0.09046554565429688, 0.09612274169921875, 0.10177993774414062, 0.1074371337890625, 0.11309432983398438, 0.11875152587890625, 0.12440872192382812, 0.13006591796875, 0.13572311401367188, 0.14138031005859375, 0.14703750610351562, 0.1526947021484375, 0.15835189819335938, 0.16400909423828125, 0.16966629028320312, 0.175323486328125, 0.18098068237304688, 0.18663787841796875, 0.19229507446289062, 0.1979522705078125, 0.20360946655273438, 0.20926666259765625, 0.21492385864257812, 0.2205810546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 10.0, 9.0, 15.0, 42.0, 88.0, 104.0, 209.0, 396.0, 713.0, 1360.0, 3118.0, 8207.0, 32173.0, 352408.0, 3678585.0, 91251.0, 16228.0, 5066.0, 2064.0, 1000.0, 565.0, 310.0, 138.0, 108.0, 45.0, 27.0, 23.0, 15.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359619140625, -0.3497047424316406, -0.33979034423828125, -0.3298759460449219, -0.3199615478515625, -0.3100471496582031, -0.30013275146484375, -0.2902183532714844, -0.280303955078125, -0.2703895568847656, -0.26047515869140625, -0.2505607604980469, -0.2406463623046875, -0.23073196411132812, -0.22081756591796875, -0.21090316772460938, -0.20098876953125, -0.19107437133789062, -0.18115997314453125, -0.17124557495117188, -0.1613311767578125, -0.15141677856445312, -0.14150238037109375, -0.13158798217773438, -0.121673583984375, -0.11175918579101562, -0.10184478759765625, -0.09193038940429688, -0.0820159912109375, -0.07210159301757812, -0.06218719482421875, -0.052272796630859375, -0.0423583984375, -0.032444000244140625, -0.02252960205078125, -0.012615203857421875, -0.0027008056640625, 0.007213592529296875, 0.01712799072265625, 0.027042388916015625, 0.036956787109375, 0.046871185302734375, 0.05678558349609375, 0.06669998168945312, 0.0766143798828125, 0.08652877807617188, 0.09644317626953125, 0.10635757446289062, 0.11627197265625, 0.12618637084960938, 0.13610076904296875, 0.14601516723632812, 0.1559295654296875, 0.16584396362304688, 0.17575836181640625, 0.18567276000976562, 0.195587158203125, 0.20550155639648438, 0.21541595458984375, 0.22533035278320312, 0.2352447509765625, 0.24515914916992188, 0.25507354736328125, 0.2649879455566406, 0.27490234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 9.0, 16.0, 22.0, 35.0, 70.0, 137.0, 526.0, 2500.0, 461.0, 132.0, 45.0, 37.0, 16.0, 15.0, 14.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1417236328125, -0.13691329956054688, -0.13210296630859375, -0.12729263305664062, -0.1224822998046875, -0.11767196655273438, -0.11286163330078125, -0.10805130004882812, -0.103240966796875, -0.09843063354492188, -0.09362030029296875, -0.08880996704101562, -0.0839996337890625, -0.07918930053710938, -0.07437896728515625, -0.06956863403320312, -0.06475830078125, -0.059947967529296875, -0.05513763427734375, -0.050327301025390625, -0.0455169677734375, -0.040706634521484375, -0.03589630126953125, -0.031085968017578125, -0.026275634765625, -0.021465301513671875, -0.01665496826171875, -0.011844635009765625, -0.0070343017578125, -0.002223968505859375, 0.00258636474609375, 0.007396697998046875, 0.01220703125, 0.017017364501953125, 0.02182769775390625, 0.026638031005859375, 0.0314483642578125, 0.036258697509765625, 0.04106903076171875, 0.045879364013671875, 0.050689697265625, 0.055500030517578125, 0.06031036376953125, 0.06512069702148438, 0.0699310302734375, 0.07474136352539062, 0.07955169677734375, 0.08436203002929688, 0.08917236328125, 0.09398269653320312, 0.09879302978515625, 0.10360336303710938, 0.1084136962890625, 0.11322402954101562, 0.11803436279296875, 0.12284469604492188, 0.127655029296875, 0.13246536254882812, 0.13727569580078125, 0.14208602905273438, 0.1468963623046875, 0.15170669555664062, 0.15651702880859375, 0.16132736206054688, 0.1661376953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 6.0, 10.0, 13.0, 33.0, 43.0, 73.0, 131.0, 158.0, 164.0, 149.0, 93.0, 65.0, 29.0, 14.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5560423731803894, -0.5384963154792786, -0.5209503173828125, -0.5034042596817017, -0.4858582317829132, -0.46831220388412476, -0.4507661461830139, -0.43322011828422546, -0.415674090385437, -0.39812806248664856, -0.3805820345878601, -0.36303597688674927, -0.3454899489879608, -0.32794392108917236, -0.3103978633880615, -0.29285183548927307, -0.2753058075904846, -0.25775977969169617, -0.24021373689174652, -0.22266769409179688, -0.20512166619300842, -0.18757563829421997, -0.17002959549427032, -0.15248355269432068, -0.13493752479553223, -0.11739148944616318, -0.09984545409679413, -0.08229941874742508, -0.06475338339805603, -0.04720734804868698, -0.029661312699317932, -0.012115277349948883, 0.005430698394775391, 0.02297673374414444, 0.04052276909351349, 0.05806880444288254, 0.07561483979225159, 0.09316087514162064, 0.11070691049098969, 0.12825295329093933, 0.14579898118972778, 0.16334500908851624, 0.18089105188846588, 0.19843709468841553, 0.21598312258720398, 0.23352915048599243, 0.25107520818710327, 0.2686212360858917, 0.2861672639846802, 0.30371329188346863, 0.3212593197822571, 0.3388053774833679, 0.35635140538215637, 0.3738974332809448, 0.39144349098205566, 0.4089895188808441, 0.42653554677963257, 0.444081574678421, 0.4616276025772095, 0.4791736602783203, 0.49671968817710876, 0.5142657160758972, 0.5318117737770081, 0.5493577718734741, 0.566903829574585]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 16.0, 19.0, 16.0, 18.0, 23.0, 25.0, 32.0, 37.0, 45.0, 51.0, 45.0, 60.0, 57.0, 63.0, 63.0, 57.0, 70.0, 50.0, 44.0, 40.0, 31.0, 24.0, 31.0, 18.0, 11.0, 6.0, 16.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.48112577199935913, -0.46922507882118225, -0.457324355840683, -0.4454236626625061, -0.43352293968200684, -0.42162224650382996, -0.4097215235233307, -0.3978208303451538, -0.38592010736465454, -0.37401941418647766, -0.3621186912059784, -0.3502179980278015, -0.33831727504730225, -0.32641658186912537, -0.3145158588886261, -0.3026151657104492, -0.29071444272994995, -0.27881374955177307, -0.2669130265712738, -0.2550123333930969, -0.24311161041259766, -0.23121090233325958, -0.2193101942539215, -0.20740950107574463, -0.19550880789756775, -0.18360809981822968, -0.1717073917388916, -0.15980668365955353, -0.14790597558021545, -0.13600526750087738, -0.1241045668721199, -0.11220385879278183, -0.10030314326286316, -0.08840243518352509, -0.07650172710418701, -0.06460101902484894, -0.05270031467080116, -0.04079960659146309, -0.028898902237415314, -0.01699819415807724, -0.005097486078739166, 0.006803221069276333, 0.018703928217291832, 0.030604634433984756, 0.04250534251332283, 0.054406050592660904, 0.06630675494670868, 0.07820746302604675, 0.09010817110538483, 0.1020088791847229, 0.11390958726406097, 0.12581029534339905, 0.13771100342273712, 0.1496117115020752, 0.16151240468025208, 0.17341312766075134, 0.18531382083892822, 0.1972145289182663, 0.20911523699760437, 0.22101594507694244, 0.23291665315628052, 0.2448173612356186, 0.25671806931495667, 0.26861876249313354, 0.2805194854736328]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 15.0, 19.0, 20.0, 49.0, 77.0, 119.0, 262.0, 480.0, 1058.0, 2959.0, 11111.0, 73832.0, 674723.0, 250223.0, 25131.0, 5346.0, 1657.0, 726.0, 327.0, 158.0, 92.0, 62.0, 28.0, 22.0, 14.0, 12.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6430511474609375, -0.623992919921875, -0.6049346923828125, -0.58587646484375, -0.5668182373046875, -0.547760009765625, -0.5287017822265625, -0.5096435546875, -0.4905853271484375, -0.471527099609375, -0.4524688720703125, -0.43341064453125, -0.4143524169921875, -0.395294189453125, -0.3762359619140625, -0.357177734375, -0.3381195068359375, -0.319061279296875, -0.3000030517578125, -0.28094482421875, -0.2618865966796875, -0.242828369140625, -0.2237701416015625, -0.2047119140625, -0.1856536865234375, -0.166595458984375, -0.1475372314453125, -0.12847900390625, -0.1094207763671875, -0.090362548828125, -0.0713043212890625, -0.05224609375, -0.0331878662109375, -0.014129638671875, 0.0049285888671875, 0.02398681640625, 0.0430450439453125, 0.062103271484375, 0.0811614990234375, 0.1002197265625, 0.1192779541015625, 0.138336181640625, 0.1573944091796875, 0.17645263671875, 0.1955108642578125, 0.214569091796875, 0.2336273193359375, 0.252685546875, 0.2717437744140625, 0.290802001953125, 0.3098602294921875, 0.32891845703125, 0.3479766845703125, 0.367034912109375, 0.3860931396484375, 0.4051513671875, 0.4242095947265625, 0.443267822265625, 0.4623260498046875, 0.48138427734375, 0.5004425048828125, 0.519500732421875, 0.5385589599609375, 0.5576171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 12.0, 13.0, 17.0, 28.0, 43.0, 63.0, 102.0, 95.0, 101.0, 127.0, 104.0, 75.0, 63.0, 51.0, 32.0, 22.0, 19.0, 6.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1560192108154297, -0.15005111694335938, -0.14408302307128906, -0.13811492919921875, -0.13214683532714844, -0.12617874145507812, -0.12021064758300781, -0.1142425537109375, -0.10827445983886719, -0.10230636596679688, -0.09633827209472656, -0.09037017822265625, -0.08440208435058594, -0.07843399047851562, -0.07246589660644531, -0.066497802734375, -0.06052970886230469, -0.054561614990234375, -0.04859352111816406, -0.04262542724609375, -0.03665733337402344, -0.030689239501953125, -0.024721145629882812, -0.0187530517578125, -0.012784957885742188, -0.006816864013671875, -0.0008487701416015625, 0.00511932373046875, 0.011087417602539062, 0.017055511474609375, 0.023023605346679688, 0.02899169921875, 0.03495979309082031, 0.040927886962890625, 0.04689598083496094, 0.05286407470703125, 0.05883216857910156, 0.06480026245117188, 0.07076835632324219, 0.0767364501953125, 0.08270454406738281, 0.08867263793945312, 0.09464073181152344, 0.10060882568359375, 0.10657691955566406, 0.11254501342773438, 0.11851310729980469, 0.124481201171875, 0.1304492950439453, 0.13641738891601562, 0.14238548278808594, 0.14835357666015625, 0.15432167053222656, 0.16028976440429688, 0.1662578582763672, 0.1722259521484375, 0.1781940460205078, 0.18416213989257812, 0.19013023376464844, 0.19609832763671875, 0.20206642150878906, 0.20803451538085938, 0.2140026092529297, 0.219970703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 3.0, 18.0, 20.0, 18.0, 41.0, 45.0, 97.0, 145.0, 311.0, 587.0, 1266.0, 3497.0, 10719.0, 42070.0, 226977.0, 574208.0, 147034.0, 28707.0, 7993.0, 2644.0, 1058.0, 501.0, 209.0, 135.0, 81.0, 62.0, 33.0, 17.0, 10.0, 16.0, 4.0, 6.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3241424560546875, -0.313812255859375, -0.3034820556640625, -0.29315185546875, -0.2828216552734375, -0.272491455078125, -0.2621612548828125, -0.2518310546875, -0.2415008544921875, -0.231170654296875, -0.2208404541015625, -0.21051025390625, -0.2001800537109375, -0.189849853515625, -0.1795196533203125, -0.169189453125, -0.1588592529296875, -0.148529052734375, -0.1381988525390625, -0.12786865234375, -0.1175384521484375, -0.107208251953125, -0.0968780517578125, -0.0865478515625, -0.0762176513671875, -0.065887451171875, -0.0555572509765625, -0.04522705078125, -0.0348968505859375, -0.024566650390625, -0.0142364501953125, -0.00390625, 0.0064239501953125, 0.016754150390625, 0.0270843505859375, 0.03741455078125, 0.0477447509765625, 0.058074951171875, 0.0684051513671875, 0.0787353515625, 0.0890655517578125, 0.099395751953125, 0.1097259521484375, 0.12005615234375, 0.1303863525390625, 0.140716552734375, 0.1510467529296875, 0.161376953125, 0.1717071533203125, 0.182037353515625, 0.1923675537109375, 0.20269775390625, 0.2130279541015625, 0.223358154296875, 0.2336883544921875, 0.2440185546875, 0.2543487548828125, 0.264678955078125, 0.2750091552734375, 0.28533935546875, 0.2956695556640625, 0.305999755859375, 0.3163299560546875, 0.32666015625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 5.0, 7.0, 9.0, 10.0, 11.0, 17.0, 8.0, 22.0, 19.0, 24.0, 25.0, 25.0, 42.0, 50.0, 35.0, 50.0, 47.0, 47.0, 47.0, 52.0, 54.0, 45.0, 45.0, 42.0, 45.0, 34.0, 36.0, 25.0, 25.0, 12.0, 15.0, 13.0, 14.0, 5.0, 8.0, 8.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0], "bins": [-0.475341796875, -0.46256256103515625, -0.4497833251953125, -0.43700408935546875, -0.424224853515625, -0.41144561767578125, -0.3986663818359375, -0.38588714599609375, -0.37310791015625, -0.36032867431640625, -0.3475494384765625, -0.33477020263671875, -0.321990966796875, -0.30921173095703125, -0.2964324951171875, -0.28365325927734375, -0.2708740234375, -0.25809478759765625, -0.2453155517578125, -0.23253631591796875, -0.219757080078125, -0.20697784423828125, -0.1941986083984375, -0.18141937255859375, -0.16864013671875, -0.15586090087890625, -0.1430816650390625, -0.13030242919921875, -0.117523193359375, -0.10474395751953125, -0.0919647216796875, -0.07918548583984375, -0.06640625, -0.05362701416015625, -0.0408477783203125, -0.02806854248046875, -0.015289306640625, -0.00251007080078125, 0.0102691650390625, 0.02304840087890625, 0.03582763671875, 0.04860687255859375, 0.0613861083984375, 0.07416534423828125, 0.086944580078125, 0.09972381591796875, 0.1125030517578125, 0.12528228759765625, 0.1380615234375, 0.15084075927734375, 0.1636199951171875, 0.17639923095703125, 0.189178466796875, 0.20195770263671875, 0.2147369384765625, 0.22751617431640625, 0.24029541015625, 0.25307464599609375, 0.2658538818359375, 0.27863311767578125, 0.291412353515625, 0.30419158935546875, 0.3169708251953125, 0.32975006103515625, 0.342529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 8.0, 6.0, 14.0, 18.0, 36.0, 70.0, 149.0, 290.0, 783.0, 3063.0, 23872.0, 625264.0, 374216.0, 17049.0, 2454.0, 697.0, 279.0, 132.0, 69.0, 41.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2373046875, -0.22910308837890625, -0.2209014892578125, -0.21269989013671875, -0.204498291015625, -0.19629669189453125, -0.1880950927734375, -0.17989349365234375, -0.17169189453125, -0.16349029541015625, -0.1552886962890625, -0.14708709716796875, -0.138885498046875, -0.13068389892578125, -0.1224822998046875, -0.11428070068359375, -0.1060791015625, -0.09787750244140625, -0.0896759033203125, -0.08147430419921875, -0.073272705078125, -0.06507110595703125, -0.0568695068359375, -0.04866790771484375, -0.04046630859375, -0.03226470947265625, -0.0240631103515625, -0.01586151123046875, -0.007659912109375, 0.00054168701171875, 0.0087432861328125, 0.01694488525390625, 0.025146484375, 0.03334808349609375, 0.0415496826171875, 0.04975128173828125, 0.057952880859375, 0.06615447998046875, 0.0743560791015625, 0.08255767822265625, 0.09075927734375, 0.09896087646484375, 0.1071624755859375, 0.11536407470703125, 0.123565673828125, 0.13176727294921875, 0.1399688720703125, 0.14817047119140625, 0.1563720703125, 0.16457366943359375, 0.1727752685546875, 0.18097686767578125, 0.189178466796875, 0.19738006591796875, 0.2055816650390625, 0.21378326416015625, 0.22198486328125, 0.23018646240234375, 0.2383880615234375, 0.24658966064453125, 0.254791259765625, 0.26299285888671875, 0.2711944580078125, 0.27939605712890625, 0.28759765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 1.0, 15.0, 18.0, 12.0, 16.0, 39.0, 33.0, 46.0, 70.0, 125.0, 156.0, 138.0, 85.0, 60.0, 50.0, 38.0, 29.0, 18.0, 10.0, 10.0, 11.0, 8.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001074671745300293, -0.00010296422988176346, -9.846128523349762e-05, -9.395834058523178e-05, -8.945539593696594e-05, -8.49524512887001e-05, -8.044950664043427e-05, -7.594656199216843e-05, -7.144361734390259e-05, -6.694067269563675e-05, -6.243772804737091e-05, -5.793478339910507e-05, -5.3431838750839233e-05, -4.8928894102573395e-05, -4.4425949454307556e-05, -3.992300480604172e-05, -3.542006015777588e-05, -3.091711550951004e-05, -2.64141708612442e-05, -2.1911226212978363e-05, -1.7408281564712524e-05, -1.2905336916446686e-05, -8.402392268180847e-06, -3.8994476199150085e-06, 6.034970283508301e-07, 5.106441676616669e-06, 9.609386324882507e-06, 1.4112330973148346e-05, 1.8615275621414185e-05, 2.3118220269680023e-05, 2.7621164917945862e-05, 3.21241095662117e-05, 3.662705421447754e-05, 4.112999886274338e-05, 4.5632943511009216e-05, 5.0135888159275055e-05, 5.4638832807540894e-05, 5.914177745580673e-05, 6.364472210407257e-05, 6.814766675233841e-05, 7.265061140060425e-05, 7.715355604887009e-05, 8.165650069713593e-05, 8.615944534540176e-05, 9.06623899936676e-05, 9.516533464193344e-05, 9.966827929019928e-05, 0.00010417122393846512, 0.00010867416858673096, 0.0001131771132349968, 0.00011768005788326263, 0.00012218300253152847, 0.0001266859471797943, 0.00013118889182806015, 0.000135691836476326, 0.00014019478112459183, 0.00014469772577285767, 0.0001492006704211235, 0.00015370361506938934, 0.00015820655971765518, 0.00016270950436592102, 0.00016721244901418686, 0.0001717153936624527, 0.00017621833831071854, 0.00018072128295898438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 10.0, 12.0, 17.0, 27.0, 31.0, 57.0, 92.0, 143.0, 282.0, 579.0, 1493.0, 5981.0, 43199.0, 553106.0, 403427.0, 32525.0, 4986.0, 1362.0, 536.0, 273.0, 143.0, 104.0, 57.0, 35.0, 27.0, 21.0, 11.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22754859924316406, -0.22084426879882812, -0.2141399383544922, -0.20743560791015625, -0.2007312774658203, -0.19402694702148438, -0.18732261657714844, -0.1806182861328125, -0.17391395568847656, -0.16720962524414062, -0.1605052947998047, -0.15380096435546875, -0.1470966339111328, -0.14039230346679688, -0.13368797302246094, -0.126983642578125, -0.12027931213378906, -0.11357498168945312, -0.10687065124511719, -0.10016632080078125, -0.09346199035644531, -0.08675765991210938, -0.08005332946777344, -0.0733489990234375, -0.06664466857910156, -0.059940338134765625, -0.05323600769042969, -0.04653167724609375, -0.03982734680175781, -0.033123016357421875, -0.026418685913085938, -0.01971435546875, -0.013010025024414062, -0.006305694580078125, 0.0003986358642578125, 0.00710296630859375, 0.013807296752929688, 0.020511627197265625, 0.027215957641601562, 0.0339202880859375, 0.04062461853027344, 0.047328948974609375, 0.05403327941894531, 0.06073760986328125, 0.06744194030761719, 0.07414627075195312, 0.08085060119628906, 0.087554931640625, 0.09425926208496094, 0.10096359252929688, 0.10766792297363281, 0.11437225341796875, 0.12107658386230469, 0.12778091430664062, 0.13448524475097656, 0.1411895751953125, 0.14789390563964844, 0.15459823608398438, 0.1613025665283203, 0.16800689697265625, 0.1747112274169922, 0.18141555786132812, 0.18811988830566406, 0.19482421875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 15.0, 18.0, 25.0, 23.0, 70.0, 80.0, 96.0, 157.0, 160.0, 125.0, 56.0, 44.0, 45.0, 25.0, 20.0, 11.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10101318359375, -0.0947122573852539, -0.08841133117675781, -0.08211040496826172, -0.07580947875976562, -0.06950855255126953, -0.06320762634277344, -0.056906700134277344, -0.05060577392578125, -0.044304847717285156, -0.03800392150878906, -0.03170299530029297, -0.025402069091796875, -0.01910114288330078, -0.012800216674804688, -0.006499290466308594, -0.0001983642578125, 0.006102561950683594, 0.012403488159179688, 0.01870441436767578, 0.025005340576171875, 0.03130626678466797, 0.03760719299316406, 0.043908119201660156, 0.05020904541015625, 0.056509971618652344, 0.06281089782714844, 0.06911182403564453, 0.07541275024414062, 0.08171367645263672, 0.08801460266113281, 0.0943155288696289, 0.100616455078125, 0.1069173812866211, 0.11321830749511719, 0.11951923370361328, 0.12582015991210938, 0.13212108612060547, 0.13842201232910156, 0.14472293853759766, 0.15102386474609375, 0.15732479095458984, 0.16362571716308594, 0.16992664337158203, 0.17622756958007812, 0.18252849578857422, 0.1888294219970703, 0.1951303482055664, 0.2014312744140625, 0.2077322006225586, 0.2140331268310547, 0.22033405303955078, 0.22663497924804688, 0.23293590545654297, 0.23923683166503906, 0.24553775787353516, 0.25183868408203125, 0.25813961029052734, 0.26444053649902344, 0.27074146270751953, 0.2770423889160156, 0.2833433151245117, 0.2896442413330078, 0.2959451675415039, 0.30224609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 8.0, 17.0, 30.0, 65.0, 113.0, 183.0, 207.0, 191.0, 100.0, 52.0, 16.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8654857873916626, -1.7591750621795654, -1.6528642177581787, -1.5465534925460815, -1.4402427673339844, -1.3339320421218872, -1.22762131690979, -1.1213104724884033, -1.0149997472763062, -0.908689022064209, -0.802378237247467, -0.6960674524307251, -0.5897567272186279, -0.48344600200653076, -0.3771352171897888, -0.2708244323730469, -0.1645137071609497, -0.05820295214653015, 0.048107802867889404, 0.15441855788230896, 0.2607293128967285, 0.3670400381088257, 0.4733508229255676, 0.5796616077423096, 0.6859723329544067, 0.7922830581665039, 0.8985938429832458, 1.0049046277999878, 1.111215353012085, 1.2175260782241821, 1.3238368034362793, 1.430147647857666, 1.5364584922790527, 1.64276921749115, 1.749079942703247, 1.8553907871246338, 1.961701512336731, 2.068012237548828, 2.174323081970215, 2.2806339263916016, 2.386944532394409, 2.493255376815796, 2.5995659828186035, 2.7058768272399902, 2.812187671661377, 2.9184982776641846, 3.0248091220855713, 3.131119728088379, 3.2374305725097656, 3.3437414169311523, 3.45005202293396, 3.5563628673553467, 3.6626734733581543, 3.768984317779541, 3.8752951622009277, 3.9816060066223145, 4.087916374206543, 4.19422721862793, 4.300538063049316, 4.406848430633545, 4.513159275054932, 4.619470119476318, 4.725780963897705, 4.832091808319092, 4.9384026527404785]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 8.0, 11.0, 10.0, 13.0, 12.0, 17.0, 15.0, 23.0, 45.0, 35.0, 41.0, 27.0, 44.0, 43.0, 44.0, 47.0, 55.0, 35.0, 63.0, 51.0, 44.0, 41.0, 31.0, 25.0, 33.0, 32.0, 25.0, 20.0, 17.0, 21.0, 12.0, 12.0, 13.0, 7.0, 3.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.0801477432250977, -2.0130786895751953, -1.9460097551345825, -1.8789407014846802, -1.8118717670440674, -1.744802713394165, -1.6777336597442627, -1.61066472530365, -1.543595790863037, -1.4765267372131348, -1.409457802772522, -1.3423887491226196, -1.2753198146820068, -1.2082507610321045, -1.1411817073822021, -1.0741127729415894, -1.007043719291687, -0.9399747252464294, -0.8729057312011719, -0.8058366775512695, -0.7387677431106567, -0.6716986894607544, -0.6046296954154968, -0.5375607013702393, -0.4704917073249817, -0.4034227132797241, -0.33635371923446655, -0.2692846953868866, -0.20221570134162903, -0.13514670729637146, -0.0680776834487915, -0.0010086894035339355, 0.06606030464172363, 0.1331292986869812, 0.20019830763339996, 0.2672673165798187, 0.3343363106250763, 0.40140530467033386, 0.4684743285179138, 0.5355433225631714, 0.602612316608429, 0.6696813106536865, 0.7367503046989441, 0.8038192987442017, 0.870888352394104, 0.9379572868347168, 1.0050263404846191, 1.0720953941345215, 1.1391643285751343, 1.2062333822250366, 1.2733023166656494, 1.3403713703155518, 1.4074403047561646, 1.474509358406067, 1.5415782928466797, 1.608647346496582, 1.6757164001464844, 1.7427854537963867, 1.8098543882369995, 1.8769234418869019, 1.9439923763275146, 2.011061429977417, 2.0781304836273193, 2.1451992988586426, 2.212268352508545]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 16.0, 10.0, 16.0, 35.0, 43.0, 62.0, 117.0, 164.0, 337.0, 655.0, 1555.0, 4455.0, 18955.0, 343510.0, 3771826.0, 41356.0, 7213.0, 2128.0, 876.0, 380.0, 218.0, 113.0, 87.0, 49.0, 37.0, 17.0, 11.0, 10.0, 10.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471923828125, -0.4539070129394531, -0.43589019775390625, -0.4178733825683594, -0.3998565673828125, -0.3818397521972656, -0.36382293701171875, -0.3458061218261719, -0.327789306640625, -0.3097724914550781, -0.29175567626953125, -0.2737388610839844, -0.2557220458984375, -0.23770523071289062, -0.21968841552734375, -0.20167160034179688, -0.18365478515625, -0.16563796997070312, -0.14762115478515625, -0.12960433959960938, -0.1115875244140625, -0.09357070922851562, -0.07555389404296875, -0.057537078857421875, -0.039520263671875, -0.021503448486328125, -0.00348663330078125, 0.014530181884765625, 0.0325469970703125, 0.050563812255859375, 0.06858062744140625, 0.08659744262695312, 0.1046142578125, 0.12263107299804688, 0.14064788818359375, 0.15866470336914062, 0.1766815185546875, 0.19469833374023438, 0.21271514892578125, 0.23073196411132812, 0.248748779296875, 0.2667655944824219, 0.28478240966796875, 0.3027992248535156, 0.3208160400390625, 0.3388328552246094, 0.35684967041015625, 0.3748664855957031, 0.39288330078125, 0.4109001159667969, 0.42891693115234375, 0.4469337463378906, 0.4649505615234375, 0.4829673767089844, 0.5009841918945312, 0.5190010070800781, 0.537017822265625, 0.5550346374511719, 0.5730514526367188, 0.5910682678222656, 0.6090850830078125, 0.6271018981933594, 0.6451187133789062, 0.6631355285644531, 0.68115234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 5.0, 6.0, 18.0, 22.0, 25.0, 41.0, 63.0, 67.0, 92.0, 103.0, 81.0, 98.0, 84.0, 81.0, 61.0, 54.0, 28.0, 20.0, 15.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.15894508361816406, -0.15297317504882812, -0.1470012664794922, -0.14102935791015625, -0.1350574493408203, -0.12908554077148438, -0.12311363220214844, -0.1171417236328125, -0.11116981506347656, -0.10519790649414062, -0.09922599792480469, -0.09325408935546875, -0.08728218078613281, -0.08131027221679688, -0.07533836364746094, -0.069366455078125, -0.06339454650878906, -0.057422637939453125, -0.05145072937011719, -0.04547882080078125, -0.03950691223144531, -0.033535003662109375, -0.027563095092773438, -0.0215911865234375, -0.015619277954101562, -0.009647369384765625, -0.0036754608154296875, 0.00229644775390625, 0.008268356323242188, 0.014240264892578125, 0.020212173461914062, 0.02618408203125, 0.03215599060058594, 0.038127899169921875, 0.04409980773925781, 0.05007171630859375, 0.05604362487792969, 0.062015533447265625, 0.06798744201660156, 0.0739593505859375, 0.07993125915527344, 0.08590316772460938, 0.09187507629394531, 0.09784698486328125, 0.10381889343261719, 0.10979080200195312, 0.11576271057128906, 0.121734619140625, 0.12770652770996094, 0.13367843627929688, 0.1396503448486328, 0.14562225341796875, 0.1515941619873047, 0.15756607055664062, 0.16353797912597656, 0.1695098876953125, 0.17548179626464844, 0.18145370483398438, 0.1874256134033203, 0.19339752197265625, 0.1993694305419922, 0.20534133911132812, 0.21131324768066406, 0.21728515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 5.0, 4.0, 15.0, 8.0, 5.0, 16.0, 25.0, 28.0, 48.0, 61.0, 81.0, 130.0, 168.0, 267.0, 389.0, 596.0, 889.0, 1523.0, 2535.0, 4847.0, 9904.0, 25458.0, 90461.0, 868871.0, 2961743.0, 161409.0, 37395.0, 13252.0, 5915.0, 3165.0, 1760.0, 1069.0, 709.0, 449.0, 301.0, 232.0, 159.0, 131.0, 72.0, 46.0, 36.0, 33.0, 22.0, 17.0, 10.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 1.0], "bins": [-0.2296142578125, -0.2230854034423828, -0.21655654907226562, -0.21002769470214844, -0.20349884033203125, -0.19696998596191406, -0.19044113159179688, -0.1839122772216797, -0.1773834228515625, -0.1708545684814453, -0.16432571411132812, -0.15779685974121094, -0.15126800537109375, -0.14473915100097656, -0.13821029663085938, -0.1316814422607422, -0.125152587890625, -0.11862373352050781, -0.11209487915039062, -0.10556602478027344, -0.09903717041015625, -0.09250831604003906, -0.08597946166992188, -0.07945060729980469, -0.0729217529296875, -0.06639289855957031, -0.059864044189453125, -0.05333518981933594, -0.04680633544921875, -0.04027748107910156, -0.033748626708984375, -0.027219772338867188, -0.02069091796875, -0.014162063598632812, -0.007633209228515625, -0.0011043548583984375, 0.00542449951171875, 0.011953353881835938, 0.018482208251953125, 0.025011062622070312, 0.0315399169921875, 0.03806877136230469, 0.044597625732421875, 0.05112648010253906, 0.05765533447265625, 0.06418418884277344, 0.07071304321289062, 0.07724189758300781, 0.083770751953125, 0.09029960632324219, 0.09682846069335938, 0.10335731506347656, 0.10988616943359375, 0.11641502380371094, 0.12294387817382812, 0.1294727325439453, 0.1360015869140625, 0.1425304412841797, 0.14905929565429688, 0.15558815002441406, 0.16211700439453125, 0.16864585876464844, 0.17517471313476562, 0.1817035675048828, 0.188232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 9.0, 8.0, 18.0, 16.0, 31.0, 52.0, 82.0, 211.0, 886.0, 2012.0, 380.0, 151.0, 79.0, 37.0, 24.0, 21.0, 8.0, 12.0, 7.0, 1.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.136810302734375, -0.13092041015625, -0.125030517578125, -0.119140625, -0.113250732421875, -0.10736083984375, -0.101470947265625, -0.0955810546875, -0.089691162109375, -0.08380126953125, -0.077911376953125, -0.072021484375, -0.066131591796875, -0.06024169921875, -0.054351806640625, -0.0484619140625, -0.042572021484375, -0.03668212890625, -0.030792236328125, -0.02490234375, -0.019012451171875, -0.01312255859375, -0.007232666015625, -0.0013427734375, 0.004547119140625, 0.01043701171875, 0.016326904296875, 0.022216796875, 0.028106689453125, 0.03399658203125, 0.039886474609375, 0.0457763671875, 0.051666259765625, 0.05755615234375, 0.063446044921875, 0.0693359375, 0.075225830078125, 0.08111572265625, 0.087005615234375, 0.0928955078125, 0.098785400390625, 0.10467529296875, 0.110565185546875, 0.116455078125, 0.122344970703125, 0.12823486328125, 0.134124755859375, 0.1400146484375, 0.145904541015625, 0.15179443359375, 0.157684326171875, 0.16357421875, 0.169464111328125, 0.17535400390625, 0.181243896484375, 0.1871337890625, 0.193023681640625, 0.19891357421875, 0.204803466796875, 0.210693359375, 0.216583251953125, 0.22247314453125, 0.228363037109375, 0.2342529296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 6.0, 21.0, 39.0, 48.0, 99.0, 124.0, 162.0, 143.0, 116.0, 96.0, 43.0, 39.0, 19.0, 13.0, 8.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.5749846696853638, -0.5522289276123047, -0.5294732451438904, -0.5067175030708313, -0.4839617609977722, -0.4612060487270355, -0.43845033645629883, -0.41569459438323975, -0.39293888211250305, -0.37018316984176636, -0.3474274277687073, -0.3246717154979706, -0.3019160032272339, -0.2791602611541748, -0.2564045488834381, -0.23364882171154022, -0.21089309453964233, -0.18813736736774445, -0.16538164019584656, -0.14262592792510986, -0.11987020075321198, -0.09711447358131409, -0.07435876131057739, -0.051603034138679504, -0.028847306966781616, -0.0060915835201740265, 0.016664139926433563, 0.039419859647750854, 0.06217558681964874, 0.08493131399154663, 0.10768702626228333, 0.1304427534341812, 0.15319854021072388, 0.17595426738262177, 0.19870999455451965, 0.22146570682525635, 0.24422143399715424, 0.2669771611690521, 0.2897328734397888, 0.3124886155128479, 0.3352443277835846, 0.3580000400543213, 0.38075578212738037, 0.40351149439811707, 0.42626720666885376, 0.44902294874191284, 0.47177866101264954, 0.49453437328338623, 0.5172901153564453, 0.5400458574295044, 0.5628015398979187, 0.5855572819709778, 0.6083130240440369, 0.6310687065124512, 0.6538244485855103, 0.6765801906585693, 0.6993359327316284, 0.7220916748046875, 0.7448473572731018, 0.7676030993461609, 0.79035884141922, 0.8131145238876343, 0.8358702659606934, 0.8586260080337524, 0.8813816905021667]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 9.0, 10.0, 12.0, 16.0, 25.0, 22.0, 27.0, 35.0, 31.0, 35.0, 45.0, 36.0, 52.0, 54.0, 48.0, 61.0, 44.0, 43.0, 51.0, 49.0, 39.0, 46.0, 41.0, 29.0, 24.0, 23.0, 20.0, 14.0, 8.0, 14.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5550470948219299, -0.5390156507492065, -0.5229842662811279, -0.5069528222084045, -0.49092140793800354, -0.47488999366760254, -0.45885854959487915, -0.44282713532447815, -0.42679572105407715, -0.41076430678367615, -0.39473289251327515, -0.37870144844055176, -0.36267003417015076, -0.34663861989974976, -0.33060717582702637, -0.31457576155662537, -0.29854434728622437, -0.28251293301582336, -0.26648151874542236, -0.250450074672699, -0.23441866040229797, -0.21838724613189697, -0.20235581696033478, -0.18632438778877258, -0.17029297351837158, -0.15426155924797058, -0.1382301300764084, -0.12219870835542679, -0.10616728663444519, -0.09013586491346359, -0.074104443192482, -0.0580730214715004, -0.0420415997505188, -0.0260101780295372, -0.009978756308555603, 0.006052665412425995, 0.022084087133407593, 0.03811550885438919, 0.05414693057537079, 0.07017835229635239, 0.08620977401733398, 0.10224119573831558, 0.11827261745929718, 0.13430404663085938, 0.15033546090126038, 0.16636687517166138, 0.18239830434322357, 0.19842973351478577, 0.21446114778518677, 0.23049256205558777, 0.24652399122714996, 0.26255542039871216, 0.27858683466911316, 0.29461824893951416, 0.31064969301223755, 0.32668110728263855, 0.34271252155303955, 0.35874393582344055, 0.37477535009384155, 0.39080679416656494, 0.40683820843696594, 0.42286962270736694, 0.43890106678009033, 0.45493248105049133, 0.47096389532089233]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 1.0, 5.0, 9.0, 14.0, 21.0, 27.0, 30.0, 43.0, 74.0, 112.0, 192.0, 313.0, 552.0, 1063.0, 2232.0, 5528.0, 16864.0, 71210.0, 354578.0, 454776.0, 105481.0, 22932.0, 6925.0, 2670.0, 1272.0, 640.0, 349.0, 214.0, 138.0, 80.0, 55.0, 46.0, 28.0, 19.0, 13.0, 12.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3343658447265625, -0.321563720703125, -0.3087615966796875, -0.29595947265625, -0.2831573486328125, -0.270355224609375, -0.2575531005859375, -0.2447509765625, -0.2319488525390625, -0.219146728515625, -0.2063446044921875, -0.19354248046875, -0.1807403564453125, -0.167938232421875, -0.1551361083984375, -0.142333984375, -0.1295318603515625, -0.116729736328125, -0.1039276123046875, -0.09112548828125, -0.0783233642578125, -0.065521240234375, -0.0527191162109375, -0.0399169921875, -0.0271148681640625, -0.014312744140625, -0.0015106201171875, 0.01129150390625, 0.0240936279296875, 0.036895751953125, 0.0496978759765625, 0.0625, 0.0753021240234375, 0.088104248046875, 0.1009063720703125, 0.11370849609375, 0.1265106201171875, 0.139312744140625, 0.1521148681640625, 0.1649169921875, 0.1777191162109375, 0.190521240234375, 0.2033233642578125, 0.21612548828125, 0.2289276123046875, 0.241729736328125, 0.2545318603515625, 0.267333984375, 0.2801361083984375, 0.292938232421875, 0.3057403564453125, 0.31854248046875, 0.3313446044921875, 0.344146728515625, 0.3569488525390625, 0.3697509765625, 0.3825531005859375, 0.395355224609375, 0.4081573486328125, 0.42095947265625, 0.4337615966796875, 0.446563720703125, 0.4593658447265625, 0.47216796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 10.0, 14.0, 28.0, 36.0, 42.0, 74.0, 97.0, 82.0, 93.0, 106.0, 91.0, 81.0, 68.0, 50.0, 40.0, 26.0, 18.0, 9.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15892410278320312, -0.15280914306640625, -0.14669418334960938, -0.1405792236328125, -0.13446426391601562, -0.12834930419921875, -0.12223434448242188, -0.116119384765625, -0.11000442504882812, -0.10388946533203125, -0.09777450561523438, -0.0916595458984375, -0.08554458618164062, -0.07942962646484375, -0.07331466674804688, -0.06719970703125, -0.061084747314453125, -0.05496978759765625, -0.048854827880859375, -0.0427398681640625, -0.036624908447265625, -0.03050994873046875, -0.024394989013671875, -0.018280029296875, -0.012165069580078125, -0.00605010986328125, 6.4849853515625e-05, 0.0061798095703125, 0.012294769287109375, 0.01840972900390625, 0.024524688720703125, 0.0306396484375, 0.036754608154296875, 0.04286956787109375, 0.048984527587890625, 0.0550994873046875, 0.061214447021484375, 0.06732940673828125, 0.07344436645507812, 0.079559326171875, 0.08567428588867188, 0.09178924560546875, 0.09790420532226562, 0.1040191650390625, 0.11013412475585938, 0.11624908447265625, 0.12236404418945312, 0.12847900390625, 0.13459396362304688, 0.14070892333984375, 0.14682388305664062, 0.1529388427734375, 0.15905380249023438, 0.16516876220703125, 0.17128372192382812, 0.177398681640625, 0.18351364135742188, 0.18962860107421875, 0.19574356079101562, 0.2018585205078125, 0.20797348022460938, 0.21408843994140625, 0.22020339965820312, 0.226318359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 6.0, 6.0, 5.0, 19.0, 13.0, 36.0, 72.0, 110.0, 225.0, 499.0, 1158.0, 4515.0, 30682.0, 418591.0, 544609.0, 40099.0, 5468.0, 1361.0, 520.0, 258.0, 125.0, 74.0, 39.0, 26.0, 13.0, 6.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.650604248046875, -0.63031005859375, -0.610015869140625, -0.5897216796875, -0.569427490234375, -0.54913330078125, -0.528839111328125, -0.508544921875, -0.488250732421875, -0.46795654296875, -0.447662353515625, -0.4273681640625, -0.407073974609375, -0.38677978515625, -0.366485595703125, -0.34619140625, -0.325897216796875, -0.30560302734375, -0.285308837890625, -0.2650146484375, -0.244720458984375, -0.22442626953125, -0.204132080078125, -0.183837890625, -0.163543701171875, -0.14324951171875, -0.122955322265625, -0.1026611328125, -0.082366943359375, -0.06207275390625, -0.041778564453125, -0.021484375, -0.001190185546875, 0.01910400390625, 0.039398193359375, 0.0596923828125, 0.079986572265625, 0.10028076171875, 0.120574951171875, 0.140869140625, 0.161163330078125, 0.18145751953125, 0.201751708984375, 0.2220458984375, 0.242340087890625, 0.26263427734375, 0.282928466796875, 0.30322265625, 0.323516845703125, 0.34381103515625, 0.364105224609375, 0.3843994140625, 0.404693603515625, 0.42498779296875, 0.445281982421875, 0.465576171875, 0.485870361328125, 0.50616455078125, 0.526458740234375, 0.5467529296875, 0.567047119140625, 0.58734130859375, 0.607635498046875, 0.6279296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 8.0, 13.0, 8.0, 15.0, 14.0, 16.0, 30.0, 38.0, 51.0, 51.0, 54.0, 52.0, 59.0, 59.0, 53.0, 64.0, 52.0, 68.0, 50.0, 42.0, 34.0, 36.0, 38.0, 23.0, 12.0, 14.0, 14.0, 9.0, 11.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6678695678710938, -0.6467742919921875, -0.6256790161132812, -0.604583740234375, -0.5834884643554688, -0.5623931884765625, -0.5412979125976562, -0.52020263671875, -0.49910736083984375, -0.4780120849609375, -0.45691680908203125, -0.435821533203125, -0.41472625732421875, -0.3936309814453125, -0.37253570556640625, -0.3514404296875, -0.33034515380859375, -0.3092498779296875, -0.28815460205078125, -0.267059326171875, -0.24596405029296875, -0.2248687744140625, -0.20377349853515625, -0.18267822265625, -0.16158294677734375, -0.1404876708984375, -0.11939239501953125, -0.098297119140625, -0.07720184326171875, -0.0561065673828125, -0.03501129150390625, -0.013916015625, 0.00717926025390625, 0.0282745361328125, 0.04936981201171875, 0.070465087890625, 0.09156036376953125, 0.1126556396484375, 0.13375091552734375, 0.15484619140625, 0.17594146728515625, 0.1970367431640625, 0.21813201904296875, 0.239227294921875, 0.26032257080078125, 0.2814178466796875, 0.30251312255859375, 0.3236083984375, 0.34470367431640625, 0.3657989501953125, 0.38689422607421875, 0.407989501953125, 0.42908477783203125, 0.4501800537109375, 0.47127532958984375, 0.49237060546875, 0.5134658813476562, 0.5345611572265625, 0.5556564331054688, 0.576751708984375, 0.5978469848632812, 0.6189422607421875, 0.6400375366210938, 0.6611328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 11.0, 13.0, 21.0, 30.0, 32.0, 69.0, 122.0, 205.0, 409.0, 978.0, 2645.0, 9077.0, 53657.0, 580858.0, 358291.0, 31989.0, 6519.0, 2014.0, 795.0, 356.0, 188.0, 96.0, 58.0, 36.0, 18.0, 25.0, 16.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1993408203125, -0.19243812561035156, -0.18553543090820312, -0.1786327362060547, -0.17173004150390625, -0.1648273468017578, -0.15792465209960938, -0.15102195739746094, -0.1441192626953125, -0.13721656799316406, -0.13031387329101562, -0.12341117858886719, -0.11650848388671875, -0.10960578918457031, -0.10270309448242188, -0.09580039978027344, -0.088897705078125, -0.08199501037597656, -0.07509231567382812, -0.06818962097167969, -0.06128692626953125, -0.05438423156738281, -0.047481536865234375, -0.04057884216308594, -0.0336761474609375, -0.026773452758789062, -0.019870758056640625, -0.012968063354492188, -0.00606536865234375, 0.0008373260498046875, 0.007740020751953125, 0.014642715454101562, 0.02154541015625, 0.028448104858398438, 0.035350799560546875, 0.04225349426269531, 0.04915618896484375, 0.05605888366699219, 0.06296157836914062, 0.06986427307128906, 0.0767669677734375, 0.08366966247558594, 0.09057235717773438, 0.09747505187988281, 0.10437774658203125, 0.11128044128417969, 0.11818313598632812, 0.12508583068847656, 0.131988525390625, 0.13889122009277344, 0.14579391479492188, 0.1526966094970703, 0.15959930419921875, 0.1665019989013672, 0.17340469360351562, 0.18030738830566406, 0.1872100830078125, 0.19411277770996094, 0.20101547241210938, 0.2079181671142578, 0.21482086181640625, 0.2217235565185547, 0.22862625122070312, 0.23552894592285156, 0.242431640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 21.0, 27.0, 44.0, 74.0, 131.0, 167.0, 181.0, 121.0, 79.0, 46.0, 32.0, 22.0, 14.0, 10.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000255584716796875, -0.00024810247123241425, -0.0002406202256679535, -0.00023313798010349274, -0.00022565573453903198, -0.00021817348897457123, -0.00021069124341011047, -0.00020320899784564972, -0.00019572675228118896, -0.0001882445067167282, -0.00018076226115226746, -0.0001732800155878067, -0.00016579777002334595, -0.0001583155244588852, -0.00015083327889442444, -0.00014335103332996368, -0.00013586878776550293, -0.00012838654220104218, -0.00012090429663658142, -0.00011342205107212067, -0.00010593980550765991, -9.845755994319916e-05, -9.09753143787384e-05, -8.349306881427765e-05, -7.60108232498169e-05, -6.852857768535614e-05, -6.104633212089539e-05, -5.356408655643463e-05, -4.608184099197388e-05, -3.859959542751312e-05, -3.111734986305237e-05, -2.3635104298591614e-05, -1.615285873413086e-05, -8.670613169670105e-06, -1.1883676052093506e-06, 6.293877959251404e-06, 1.3776123523712158e-05, 2.1258369088172913e-05, 2.8740614652633667e-05, 3.622286021709442e-05, 4.3705105781555176e-05, 5.118735134601593e-05, 5.8669596910476685e-05, 6.615184247493744e-05, 7.36340880393982e-05, 8.111633360385895e-05, 8.85985791683197e-05, 9.608082473278046e-05, 0.00010356307029724121, 0.00011104531586170197, 0.00011852756142616272, 0.00012600980699062347, 0.00013349205255508423, 0.00014097429811954498, 0.00014845654368400574, 0.0001559387892484665, 0.00016342103481292725, 0.000170903280377388, 0.00017838552594184875, 0.0001858677715063095, 0.00019335001707077026, 0.00020083226263523102, 0.00020831450819969177, 0.00021579675376415253, 0.00022327899932861328]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 10.0, 7.0, 8.0, 21.0, 39.0, 43.0, 84.0, 116.0, 215.0, 412.0, 871.0, 2221.0, 6615.0, 30306.0, 225387.0, 634629.0, 121391.0, 18317.0, 4576.0, 1658.0, 763.0, 367.0, 187.0, 106.0, 79.0, 39.0, 27.0, 16.0, 13.0, 12.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2222900390625, -0.216339111328125, -0.21038818359375, -0.204437255859375, -0.198486328125, -0.192535400390625, -0.18658447265625, -0.180633544921875, -0.1746826171875, -0.168731689453125, -0.16278076171875, -0.156829833984375, -0.15087890625, -0.144927978515625, -0.13897705078125, -0.133026123046875, -0.1270751953125, -0.121124267578125, -0.11517333984375, -0.109222412109375, -0.103271484375, -0.097320556640625, -0.09136962890625, -0.085418701171875, -0.0794677734375, -0.073516845703125, -0.06756591796875, -0.061614990234375, -0.0556640625, -0.049713134765625, -0.04376220703125, -0.037811279296875, -0.0318603515625, -0.025909423828125, -0.01995849609375, -0.014007568359375, -0.008056640625, -0.002105712890625, 0.00384521484375, 0.009796142578125, 0.0157470703125, 0.021697998046875, 0.02764892578125, 0.033599853515625, 0.03955078125, 0.045501708984375, 0.05145263671875, 0.057403564453125, 0.0633544921875, 0.069305419921875, 0.07525634765625, 0.081207275390625, 0.087158203125, 0.093109130859375, 0.09906005859375, 0.105010986328125, 0.1109619140625, 0.116912841796875, 0.12286376953125, 0.128814697265625, 0.134765625, 0.140716552734375, 0.14666748046875, 0.152618408203125, 0.1585693359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 10.0, 12.0, 20.0, 34.0, 29.0, 58.0, 53.0, 83.0, 120.0, 129.0, 111.0, 80.0, 65.0, 54.0, 35.0, 34.0, 17.0, 14.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.2140178680419922, -0.20745468139648438, -0.20089149475097656, -0.19432830810546875, -0.18776512145996094, -0.18120193481445312, -0.1746387481689453, -0.1680755615234375, -0.1615123748779297, -0.15494918823242188, -0.14838600158691406, -0.14182281494140625, -0.13525962829589844, -0.12869644165039062, -0.12213325500488281, -0.115570068359375, -0.10900688171386719, -0.10244369506835938, -0.09588050842285156, -0.08931732177734375, -0.08275413513183594, -0.07619094848632812, -0.06962776184082031, -0.0630645751953125, -0.05650138854980469, -0.049938201904296875, -0.04337501525878906, -0.03681182861328125, -0.030248641967773438, -0.023685455322265625, -0.017122268676757812, -0.01055908203125, -0.0039958953857421875, 0.002567291259765625, 0.009130477905273438, 0.01569366455078125, 0.022256851196289062, 0.028820037841796875, 0.03538322448730469, 0.0419464111328125, 0.04850959777832031, 0.055072784423828125, 0.06163597106933594, 0.06819915771484375, 0.07476234436035156, 0.08132553100585938, 0.08788871765136719, 0.094451904296875, 0.10101509094238281, 0.10757827758789062, 0.11414146423339844, 0.12070465087890625, 0.12726783752441406, 0.13383102416992188, 0.1403942108154297, 0.1469573974609375, 0.1535205841064453, 0.16008377075195312, 0.16664695739746094, 0.17321014404296875, 0.17977333068847656, 0.18633651733398438, 0.1928997039794922, 0.199462890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 14.0, 18.0, 25.0, 58.0, 86.0, 120.0, 173.0, 163.0, 134.0, 97.0, 58.0, 30.0, 13.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4668079614639282, -1.3636301755905151, -1.260452389717102, -1.1572747230529785, -1.0540969371795654, -0.9509191513061523, -0.8477413654327393, -0.744563639163971, -0.6413858532905579, -0.5382080674171448, -0.43503034114837646, -0.3318525552749634, -0.22867479920387268, -0.12549704313278198, -0.022319257259368896, 0.08085846900939941, 0.1840362548828125, 0.2872140109539032, 0.3903917670249939, 0.493569552898407, 0.5967472791671753, 0.6999250650405884, 0.8031028509140015, 0.9062805771827698, 1.009458303451538, 1.1126360893249512, 1.2158138751983643, 1.3189916610717773, 1.4221693277359009, 1.525347113609314, 1.628524899482727, 1.7317025661468506, 1.8348805904388428, 1.9380583763122559, 2.041236162185669, 2.144413948059082, 2.247591733932495, 2.350769519805908, 2.453947067260742, 2.5571248531341553, 2.6603026390075684, 2.7634804248809814, 2.8666582107543945, 2.9698359966278076, 3.0730137825012207, 3.1761913299560547, 3.279369354248047, 3.382546901702881, 3.485724925994873, 3.588902711868286, 3.692080497741699, 3.7952582836151123, 3.8984360694885254, 4.001613616943359, 4.104791641235352, 4.2079691886901855, 4.3111467361450195, 4.4143242835998535, 4.517502307891846, 4.62067985534668, 4.723857879638672, 4.827035427093506, 4.930213451385498, 5.033390998840332, 5.136569023132324]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 6.0, 9.0, 12.0, 11.0, 13.0, 24.0, 33.0, 27.0, 33.0, 37.0, 35.0, 46.0, 46.0, 41.0, 51.0, 48.0, 51.0, 51.0, 51.0, 46.0, 48.0, 43.0, 27.0, 43.0, 27.0, 24.0, 22.0, 18.0, 17.0, 13.0, 11.0, 4.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6598448753356934, -2.5676393508911133, -2.475433826446533, -2.383228302001953, -2.291022777557373, -2.198817253112793, -2.106611728668213, -2.014406204223633, -1.9222005605697632, -1.829995036125183, -1.737789511680603, -1.6455838680267334, -1.5533783435821533, -1.4611728191375732, -1.3689672946929932, -1.276761770248413, -1.184556245803833, -1.092350721359253, -1.0001451969146729, -0.907939612865448, -0.8157340884208679, -0.7235285639762878, -0.631322979927063, -0.5391174554824829, -0.44691193103790283, -0.35470640659332275, -0.2625008523464203, -0.17029529809951782, -0.07808977365493774, 0.014115750789642334, 0.10632133483886719, 0.19852685928344727, 0.29073238372802734, 0.3829379081726074, 0.4751434624195099, 0.5673490166664124, 0.6595545411109924, 0.7517600655555725, 0.8439656496047974, 0.9361711740493774, 1.0283766984939575, 1.1205822229385376, 1.2127877473831177, 1.3049933910369873, 1.3971989154815674, 1.4894044399261475, 1.5816099643707275, 1.6738154888153076, 1.7660210132598877, 1.8582265377044678, 1.9504320621490479, 2.042637586593628, 2.134843111038208, 2.227048635482788, 2.3192543983459473, 2.4114599227905273, 2.5036654472351074, 2.5958709716796875, 2.6880764961242676, 2.7802820205688477, 2.8724875450134277, 2.964693069458008, 3.056898593902588, 3.149104118347168, 3.241309642791748]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 20.0, 24.0, 30.0, 43.0, 102.0, 206.0, 585.0, 2145.0, 13381.0, 4039464.0, 130696.0, 5554.0, 1294.0, 405.0, 148.0, 74.0, 40.0, 16.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1273269653320312, -1.1003570556640625, -1.0733871459960938, -1.046417236328125, -1.0194473266601562, -0.9924774169921875, -0.9655075073242188, -0.93853759765625, -0.9115676879882812, -0.8845977783203125, -0.8576278686523438, -0.830657958984375, -0.8036880493164062, -0.7767181396484375, -0.7497482299804688, -0.7227783203125, -0.6958084106445312, -0.6688385009765625, -0.6418685913085938, -0.614898681640625, -0.5879287719726562, -0.5609588623046875, -0.5339889526367188, -0.50701904296875, -0.48004913330078125, -0.4530792236328125, -0.42610931396484375, -0.399139404296875, -0.37216949462890625, -0.3451995849609375, -0.31822967529296875, -0.291259765625, -0.26428985595703125, -0.2373199462890625, -0.21035003662109375, -0.183380126953125, -0.15641021728515625, -0.1294403076171875, -0.10247039794921875, -0.07550048828125, -0.04853057861328125, -0.0215606689453125, 0.00540924072265625, 0.032379150390625, 0.05934906005859375, 0.0863189697265625, 0.11328887939453125, 0.1402587890625, 0.16722869873046875, 0.1941986083984375, 0.22116851806640625, 0.248138427734375, 0.27510833740234375, 0.3020782470703125, 0.32904815673828125, 0.35601806640625, 0.38298797607421875, 0.4099578857421875, 0.43692779541015625, 0.463897705078125, 0.49086761474609375, 0.5178375244140625, 0.5448074340820312, 0.57177734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 12.0, 9.0, 7.0, 19.0, 33.0, 49.0, 59.0, 67.0, 83.0, 96.0, 95.0, 102.0, 76.0, 59.0, 64.0, 49.0, 31.0, 19.0, 19.0, 17.0, 13.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1851806640625, -0.17846107482910156, -0.17174148559570312, -0.1650218963623047, -0.15830230712890625, -0.1515827178955078, -0.14486312866210938, -0.13814353942871094, -0.1314239501953125, -0.12470436096191406, -0.11798477172851562, -0.11126518249511719, -0.10454559326171875, -0.09782600402832031, -0.09110641479492188, -0.08438682556152344, -0.077667236328125, -0.07094764709472656, -0.06422805786132812, -0.05750846862792969, -0.05078887939453125, -0.04406929016113281, -0.037349700927734375, -0.030630111694335938, -0.0239105224609375, -0.017190933227539062, -0.010471343994140625, -0.0037517547607421875, 0.00296783447265625, 0.009687423706054688, 0.016407012939453125, 0.023126602172851562, 0.02984619140625, 0.03656578063964844, 0.043285369873046875, 0.05000495910644531, 0.05672454833984375, 0.06344413757324219, 0.07016372680664062, 0.07688331604003906, 0.0836029052734375, 0.09032249450683594, 0.09704208374023438, 0.10376167297363281, 0.11048126220703125, 0.11720085144042969, 0.12392044067382812, 0.13064002990722656, 0.137359619140625, 0.14407920837402344, 0.15079879760742188, 0.1575183868408203, 0.16423797607421875, 0.1709575653076172, 0.17767715454101562, 0.18439674377441406, 0.1911163330078125, 0.19783592224121094, 0.20455551147460938, 0.2112751007080078, 0.21799468994140625, 0.2247142791748047, 0.23143386840820312, 0.23815345764160156, 0.244873046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 9.0, 10.0, 7.0, 11.0, 13.0, 26.0, 31.0, 54.0, 65.0, 82.0, 134.0, 178.0, 284.0, 467.0, 726.0, 1397.0, 2562.0, 5511.0, 13043.0, 41612.0, 351863.0, 3656497.0, 82923.0, 20436.0, 7994.0, 3606.0, 1867.0, 1078.0, 627.0, 411.0, 249.0, 164.0, 103.0, 78.0, 51.0, 37.0, 23.0, 15.0, 9.0, 8.0, 12.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23828125, -0.23064804077148438, -0.22301483154296875, -0.21538162231445312, -0.2077484130859375, -0.20011520385742188, -0.19248199462890625, -0.18484878540039062, -0.177215576171875, -0.16958236694335938, -0.16194915771484375, -0.15431594848632812, -0.1466827392578125, -0.13904953002929688, -0.13141632080078125, -0.12378311157226562, -0.11614990234375, -0.10851669311523438, -0.10088348388671875, -0.09325027465820312, -0.0856170654296875, -0.07798385620117188, -0.07035064697265625, -0.06271743774414062, -0.055084228515625, -0.047451019287109375, -0.03981781005859375, -0.032184600830078125, -0.0245513916015625, -0.016918182373046875, -0.00928497314453125, -0.001651763916015625, 0.0059814453125, 0.013614654541015625, 0.02124786376953125, 0.028881072998046875, 0.0365142822265625, 0.044147491455078125, 0.05178070068359375, 0.059413909912109375, 0.067047119140625, 0.07468032836914062, 0.08231353759765625, 0.08994674682617188, 0.0975799560546875, 0.10521316528320312, 0.11284637451171875, 0.12047958374023438, 0.12811279296875, 0.13574600219726562, 0.14337921142578125, 0.15101242065429688, 0.1586456298828125, 0.16627883911132812, 0.17391204833984375, 0.18154525756835938, 0.189178466796875, 0.19681167602539062, 0.20444488525390625, 0.21207809448242188, 0.2197113037109375, 0.22734451293945312, 0.23497772216796875, 0.24261093139648438, 0.250244140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 15.0, 25.0, 46.0, 91.0, 312.0, 3134.0, 264.0, 75.0, 31.0, 17.0, 11.0, 9.0, 13.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.0944662094116211, -0.09164237976074219, -0.08881855010986328, -0.08599472045898438, -0.08317089080810547, -0.08034706115722656, -0.07752323150634766, -0.07469940185546875, -0.07187557220458984, -0.06905174255371094, -0.06622791290283203, -0.06340408325195312, -0.06058025360107422, -0.05775642395019531, -0.054932594299316406, -0.0521087646484375, -0.049284934997558594, -0.04646110534667969, -0.04363727569580078, -0.040813446044921875, -0.03798961639404297, -0.03516578674316406, -0.032341957092285156, -0.02951812744140625, -0.026694297790527344, -0.023870468139648438, -0.02104663848876953, -0.018222808837890625, -0.015398979187011719, -0.012575149536132812, -0.009751319885253906, -0.006927490234375, -0.004103660583496094, -0.0012798309326171875, 0.0015439987182617188, 0.004367828369140625, 0.007191658020019531, 0.010015487670898438, 0.012839317321777344, 0.01566314697265625, 0.018486976623535156, 0.021310806274414062, 0.02413463592529297, 0.026958465576171875, 0.02978229522705078, 0.03260612487792969, 0.035429954528808594, 0.0382537841796875, 0.041077613830566406, 0.04390144348144531, 0.04672527313232422, 0.049549102783203125, 0.05237293243408203, 0.05519676208496094, 0.058020591735839844, 0.06084442138671875, 0.06366825103759766, 0.06649208068847656, 0.06931591033935547, 0.07213973999023438, 0.07496356964111328, 0.07778739929199219, 0.0806112289428711, 0.08343505859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 19.0, 56.0, 154.0, 294.0, 285.0, 147.0, 40.0, 18.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16496023535728455, -0.14373484253883362, -0.12250944972038269, -0.10128405690193176, -0.08005866408348083, -0.05883327126502991, -0.03760787844657898, -0.016382485628128052, 0.004842907190322876, 0.026068300008773804, 0.04729369282722473, 0.06851908564567566, 0.08974447846412659, 0.11096987128257751, 0.13219526410102844, 0.15342065691947937, 0.1746460497379303, 0.19587144255638123, 0.21709683537483215, 0.23832222819328308, 0.259547621011734, 0.28077301383018494, 0.30199840664863586, 0.3232237994670868, 0.3444491922855377, 0.36567458510398865, 0.3868999779224396, 0.4081253707408905, 0.42935076355934143, 0.45057615637779236, 0.4718015491962433, 0.4930269420146942, 0.5142523050308228, 0.5354776978492737, 0.5567030906677246, 0.5779284834861755, 0.5991538763046265, 0.6203792691230774, 0.6416046619415283, 0.6628300547599792, 0.6840554475784302, 0.7052808403968811, 0.726506233215332, 0.747731626033783, 0.7689570188522339, 0.7901824116706848, 0.8114078044891357, 0.8326331973075867, 0.8538585901260376, 0.8750839829444885, 0.8963093757629395, 0.9175347685813904, 0.9387601613998413, 0.9599855542182922, 0.9812109470367432, 1.0024363994598389, 1.023661732673645, 1.0448870658874512, 1.0661125183105469, 1.0873379707336426, 1.1085633039474487, 1.1297886371612549, 1.1510140895843506, 1.1722395420074463, 1.1934648752212524]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 11.0, 12.0, 10.0, 14.0, 20.0, 18.0, 18.0, 29.0, 32.0, 23.0, 31.0, 34.0, 39.0, 50.0, 65.0, 44.0, 53.0, 48.0, 51.0, 27.0, 47.0, 38.0, 35.0, 33.0, 31.0, 32.0, 29.0, 13.0, 21.0, 19.0, 15.0, 11.0, 14.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14011520147323608, -0.13536687195301056, -0.13061852753162384, -0.12587019801139832, -0.12112186849117279, -0.11637353152036667, -0.11162519454956055, -0.10687686502933502, -0.1021285280585289, -0.09738019108772278, -0.09263186156749725, -0.08788352459669113, -0.08313518762588501, -0.07838685810565948, -0.07363852113485336, -0.06889018416404724, -0.06414185464382172, -0.05939352139830589, -0.05464518815279007, -0.04989685118198395, -0.045148517936468124, -0.0404001846909523, -0.03565184772014618, -0.030903514474630356, -0.026155181229114532, -0.02140684798359871, -0.016658512875437737, -0.011910178698599339, -0.0071618445217609406, -0.002413511276245117, 0.0023348238319158554, 0.007083158940076828, 0.011831492185592651, 0.016579825431108475, 0.021328160539269447, 0.02607649564743042, 0.030824828892946243, 0.03557316213846207, 0.04032149910926819, 0.04506983235478401, 0.049818165600299835, 0.05456649884581566, 0.05931483209133148, 0.0640631690621376, 0.06881150603294373, 0.07355983555316925, 0.07830817252397537, 0.0830565094947815, 0.08780483901500702, 0.09255317598581314, 0.09730150550603867, 0.10204984247684479, 0.10679817199707031, 0.11154650896787643, 0.11629484593868256, 0.12104317545890808, 0.1257915198802948, 0.13053984940052032, 0.13528819382190704, 0.14003652334213257, 0.1447848528623581, 0.14953318238258362, 0.15428152680397034, 0.15902985632419586, 0.1637781858444214]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 6.0, 3.0, 14.0, 13.0, 23.0, 41.0, 58.0, 93.0, 149.0, 299.0, 618.0, 1330.0, 3100.0, 9602.0, 40256.0, 267894.0, 576998.0, 117094.0, 20935.0, 5984.0, 2179.0, 891.0, 418.0, 208.0, 124.0, 88.0, 49.0, 28.0, 19.0, 14.0, 5.0, 2.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43341064453125, -0.4180908203125, -0.40277099609375, -0.387451171875, -0.37213134765625, -0.3568115234375, -0.34149169921875, -0.326171875, -0.31085205078125, -0.2955322265625, -0.28021240234375, -0.264892578125, -0.24957275390625, -0.2342529296875, -0.21893310546875, -0.20361328125, -0.18829345703125, -0.1729736328125, -0.15765380859375, -0.142333984375, -0.12701416015625, -0.1116943359375, -0.09637451171875, -0.0810546875, -0.06573486328125, -0.0504150390625, -0.03509521484375, -0.019775390625, -0.00445556640625, 0.0108642578125, 0.02618408203125, 0.04150390625, 0.05682373046875, 0.0721435546875, 0.08746337890625, 0.102783203125, 0.11810302734375, 0.1334228515625, 0.14874267578125, 0.1640625, 0.17938232421875, 0.1947021484375, 0.21002197265625, 0.225341796875, 0.24066162109375, 0.2559814453125, 0.27130126953125, 0.28662109375, 0.30194091796875, 0.3172607421875, 0.33258056640625, 0.347900390625, 0.36322021484375, 0.3785400390625, 0.39385986328125, 0.4091796875, 0.42449951171875, 0.4398193359375, 0.45513916015625, 0.470458984375, 0.48577880859375, 0.5010986328125, 0.51641845703125, 0.53173828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 11.0, 7.0, 15.0, 26.0, 46.0, 60.0, 68.0, 77.0, 76.0, 112.0, 91.0, 90.0, 67.0, 61.0, 45.0, 41.0, 19.0, 27.0, 18.0, 12.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18241500854492188, -0.17562103271484375, -0.16882705688476562, -0.1620330810546875, -0.15523910522460938, -0.14844512939453125, -0.14165115356445312, -0.134857177734375, -0.12806320190429688, -0.12126922607421875, -0.11447525024414062, -0.1076812744140625, -0.10088729858398438, -0.09409332275390625, -0.08729934692382812, -0.08050537109375, -0.07371139526367188, -0.06691741943359375, -0.060123443603515625, -0.0533294677734375, -0.046535491943359375, -0.03974151611328125, -0.032947540283203125, -0.026153564453125, -0.019359588623046875, -0.01256561279296875, -0.005771636962890625, 0.0010223388671875, 0.007816314697265625, 0.01461029052734375, 0.021404266357421875, 0.0281982421875, 0.034992218017578125, 0.04178619384765625, 0.048580169677734375, 0.0553741455078125, 0.062168121337890625, 0.06896209716796875, 0.07575607299804688, 0.082550048828125, 0.08934402465820312, 0.09613800048828125, 0.10293197631835938, 0.1097259521484375, 0.11651992797851562, 0.12331390380859375, 0.13010787963867188, 0.13690185546875, 0.14369583129882812, 0.15048980712890625, 0.15728378295898438, 0.1640777587890625, 0.17087173461914062, 0.17766571044921875, 0.18445968627929688, 0.191253662109375, 0.19804763793945312, 0.20484161376953125, 0.21163558959960938, 0.2184295654296875, 0.22522354125976562, 0.23201751708984375, 0.23881149291992188, 0.24560546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 8.0, 12.0, 22.0, 30.0, 75.0, 130.0, 230.0, 607.0, 1954.0, 9839.0, 191732.0, 803800.0, 34306.0, 3995.0, 1048.0, 388.0, 161.0, 84.0, 39.0, 31.0, 17.0, 10.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80517578125, -0.7794113159179688, -0.7536468505859375, -0.7278823852539062, -0.702117919921875, -0.6763534545898438, -0.6505889892578125, -0.6248245239257812, -0.59906005859375, -0.5732955932617188, -0.5475311279296875, -0.5217666625976562, -0.496002197265625, -0.47023773193359375, -0.4444732666015625, -0.41870880126953125, -0.3929443359375, -0.36717987060546875, -0.3414154052734375, -0.31565093994140625, -0.289886474609375, -0.26412200927734375, -0.2383575439453125, -0.21259307861328125, -0.18682861328125, -0.16106414794921875, -0.1352996826171875, -0.10953521728515625, -0.083770751953125, -0.05800628662109375, -0.0322418212890625, -0.00647735595703125, 0.019287109375, 0.04505157470703125, 0.0708160400390625, 0.09658050537109375, 0.122344970703125, 0.14810943603515625, 0.1738739013671875, 0.19963836669921875, 0.22540283203125, 0.25116729736328125, 0.2769317626953125, 0.30269622802734375, 0.328460693359375, 0.35422515869140625, 0.3799896240234375, 0.40575408935546875, 0.4315185546875, 0.45728302001953125, 0.4830474853515625, 0.5088119506835938, 0.534576416015625, 0.5603408813476562, 0.5861053466796875, 0.6118698120117188, 0.63763427734375, 0.6633987426757812, 0.6891632080078125, 0.7149276733398438, 0.740692138671875, 0.7664566040039062, 0.7922210693359375, 0.8179855346679688, 0.84375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 6.0, 3.0, 5.0, 5.0, 11.0, 13.0, 20.0, 25.0, 34.0, 42.0, 50.0, 50.0, 40.0, 67.0, 47.0, 62.0, 50.0, 52.0, 77.0, 58.0, 54.0, 48.0, 40.0, 23.0, 25.0, 23.0, 15.0, 16.0, 8.0, 7.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7509765625, -0.72625732421875, -0.7015380859375, -0.67681884765625, -0.652099609375, -0.62738037109375, -0.6026611328125, -0.57794189453125, -0.55322265625, -0.52850341796875, -0.5037841796875, -0.47906494140625, -0.454345703125, -0.42962646484375, -0.4049072265625, -0.38018798828125, -0.35546875, -0.33074951171875, -0.3060302734375, -0.28131103515625, -0.256591796875, -0.23187255859375, -0.2071533203125, -0.18243408203125, -0.15771484375, -0.13299560546875, -0.1082763671875, -0.08355712890625, -0.058837890625, -0.03411865234375, -0.0093994140625, 0.01531982421875, 0.0400390625, 0.06475830078125, 0.0894775390625, 0.11419677734375, 0.138916015625, 0.16363525390625, 0.1883544921875, 0.21307373046875, 0.23779296875, 0.26251220703125, 0.2872314453125, 0.31195068359375, 0.336669921875, 0.36138916015625, 0.3861083984375, 0.41082763671875, 0.435546875, 0.46026611328125, 0.4849853515625, 0.50970458984375, 0.534423828125, 0.55914306640625, 0.5838623046875, 0.60858154296875, 0.63330078125, 0.65802001953125, 0.6827392578125, 0.70745849609375, 0.732177734375, 0.75689697265625, 0.7816162109375, 0.80633544921875, 0.8310546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 11.0, 12.0, 15.0, 20.0, 24.0, 38.0, 52.0, 96.0, 147.0, 242.0, 519.0, 1287.0, 4695.0, 45954.0, 920259.0, 67026.0, 5390.0, 1479.0, 541.0, 288.0, 125.0, 92.0, 65.0, 36.0, 26.0, 19.0, 22.0, 14.0, 6.0, 9.0, 6.0, 7.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.427734375, -0.41498565673828125, -0.4022369384765625, -0.38948822021484375, -0.376739501953125, -0.36399078369140625, -0.3512420654296875, -0.33849334716796875, -0.32574462890625, -0.31299591064453125, -0.3002471923828125, -0.28749847412109375, -0.274749755859375, -0.26200103759765625, -0.2492523193359375, -0.23650360107421875, -0.2237548828125, -0.21100616455078125, -0.1982574462890625, -0.18550872802734375, -0.172760009765625, -0.16001129150390625, -0.1472625732421875, -0.13451385498046875, -0.12176513671875, -0.10901641845703125, -0.0962677001953125, -0.08351898193359375, -0.070770263671875, -0.05802154541015625, -0.0452728271484375, -0.03252410888671875, -0.019775390625, -0.00702667236328125, 0.0057220458984375, 0.01847076416015625, 0.031219482421875, 0.04396820068359375, 0.0567169189453125, 0.06946563720703125, 0.08221435546875, 0.09496307373046875, 0.1077117919921875, 0.12046051025390625, 0.133209228515625, 0.14595794677734375, 0.1587066650390625, 0.17145538330078125, 0.1842041015625, 0.19695281982421875, 0.2097015380859375, 0.22245025634765625, 0.235198974609375, 0.24794769287109375, 0.2606964111328125, 0.27344512939453125, 0.28619384765625, 0.29894256591796875, 0.3116912841796875, 0.32444000244140625, 0.337188720703125, 0.34993743896484375, 0.3626861572265625, 0.37543487548828125, 0.38818359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 10.0, 18.0, 22.0, 35.0, 60.0, 80.0, 119.0, 117.0, 111.0, 124.0, 94.0, 73.0, 45.0, 23.0, 23.0, 12.0, 8.0, 6.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.522106170654297e-05, -7.06017017364502e-05, -6.598234176635742e-05, -6.136298179626465e-05, -5.6743621826171875e-05, -5.21242618560791e-05, -4.750490188598633e-05, -4.2885541915893555e-05, -3.826618194580078e-05, -3.364682197570801e-05, -2.9027462005615234e-05, -2.440810203552246e-05, -1.9788742065429688e-05, -1.5169382095336914e-05, -1.055002212524414e-05, -5.930662155151367e-06, -1.3113021850585938e-06, 3.3080577850341797e-06, 7.927417755126953e-06, 1.2546777725219727e-05, 1.71661376953125e-05, 2.1785497665405273e-05, 2.6404857635498047e-05, 3.102421760559082e-05, 3.5643577575683594e-05, 4.026293754577637e-05, 4.488229751586914e-05, 4.9501657485961914e-05, 5.412101745605469e-05, 5.874037742614746e-05, 6.335973739624023e-05, 6.797909736633301e-05, 7.259845733642578e-05, 7.721781730651855e-05, 8.183717727661133e-05, 8.64565372467041e-05, 9.107589721679688e-05, 9.569525718688965e-05, 0.00010031461715698242, 0.0001049339771270752, 0.00010955333709716797, 0.00011417269706726074, 0.00011879205703735352, 0.0001234114170074463, 0.00012803077697753906, 0.00013265013694763184, 0.0001372694969177246, 0.00014188885688781738, 0.00014650821685791016, 0.00015112757682800293, 0.0001557469367980957, 0.00016036629676818848, 0.00016498565673828125, 0.00016960501670837402, 0.0001742243766784668, 0.00017884373664855957, 0.00018346309661865234, 0.00018808245658874512, 0.0001927018165588379, 0.00019732117652893066, 0.00020194053649902344, 0.0002065598964691162, 0.00021117925643920898, 0.00021579861640930176, 0.00022041797637939453]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 8.0, 8.0, 16.0, 14.0, 32.0, 55.0, 111.0, 229.0, 582.0, 1733.0, 7077.0, 76156.0, 853990.0, 97379.0, 8149.0, 1854.0, 640.0, 251.0, 108.0, 50.0, 28.0, 18.0, 11.0, 12.0, 3.0, 4.0, 10.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.34716796875, -0.3373985290527344, -0.32762908935546875, -0.3178596496582031, -0.3080902099609375, -0.2983207702636719, -0.28855133056640625, -0.2787818908691406, -0.269012451171875, -0.2592430114746094, -0.24947357177734375, -0.23970413208007812, -0.2299346923828125, -0.22016525268554688, -0.21039581298828125, -0.20062637329101562, -0.19085693359375, -0.18108749389648438, -0.17131805419921875, -0.16154861450195312, -0.1517791748046875, -0.14200973510742188, -0.13224029541015625, -0.12247085571289062, -0.112701416015625, -0.10293197631835938, -0.09316253662109375, -0.08339309692382812, -0.0736236572265625, -0.06385421752929688, -0.05408477783203125, -0.044315338134765625, -0.0345458984375, -0.024776458740234375, -0.01500701904296875, -0.005237579345703125, 0.0045318603515625, 0.014301300048828125, 0.02407073974609375, 0.033840179443359375, 0.043609619140625, 0.053379058837890625, 0.06314849853515625, 0.07291793823242188, 0.0826873779296875, 0.09245681762695312, 0.10222625732421875, 0.11199569702148438, 0.12176513671875, 0.13153457641601562, 0.14130401611328125, 0.15107345581054688, 0.1608428955078125, 0.17061233520507812, 0.18038177490234375, 0.19015121459960938, 0.199920654296875, 0.20969009399414062, 0.21945953369140625, 0.22922897338867188, 0.2389984130859375, 0.24876785278320312, 0.25853729248046875, 0.2683067321777344, 0.278076171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 5.0, 13.0, 23.0, 25.0, 54.0, 85.0, 110.0, 138.0, 178.0, 125.0, 81.0, 57.0, 25.0, 18.0, 15.0, 6.0, 8.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35791015625, -0.3473472595214844, -0.33678436279296875, -0.3262214660644531, -0.3156585693359375, -0.3050956726074219, -0.29453277587890625, -0.2839698791503906, -0.273406982421875, -0.2628440856933594, -0.25228118896484375, -0.24171829223632812, -0.2311553955078125, -0.22059249877929688, -0.21002960205078125, -0.19946670532226562, -0.18890380859375, -0.17834091186523438, -0.16777801513671875, -0.15721511840820312, -0.1466522216796875, -0.13608932495117188, -0.12552642822265625, -0.11496353149414062, -0.104400634765625, -0.09383773803710938, -0.08327484130859375, -0.07271194458007812, -0.0621490478515625, -0.051586151123046875, -0.04102325439453125, -0.030460357666015625, -0.0198974609375, -0.009334564208984375, 0.00122833251953125, 0.011791229248046875, 0.0223541259765625, 0.032917022705078125, 0.04347991943359375, 0.054042816162109375, 0.064605712890625, 0.07516860961914062, 0.08573150634765625, 0.09629440307617188, 0.1068572998046875, 0.11742019653320312, 0.12798309326171875, 0.13854598999023438, 0.14910888671875, 0.15967178344726562, 0.17023468017578125, 0.18079757690429688, 0.1913604736328125, 0.20192337036132812, 0.21248626708984375, 0.22304916381835938, 0.233612060546875, 0.24417495727539062, 0.25473785400390625, 0.2653007507324219, 0.2758636474609375, 0.2864265441894531, 0.29698944091796875, 0.3075523376464844, 0.318115234375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 26.0, 68.0, 110.0, 208.0, 237.0, 165.0, 101.0, 43.0, 10.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.714663505554199, -5.53700065612793, -5.35933780670166, -5.181674957275391, -5.004011631011963, -4.826348781585693, -4.648685932159424, -4.471023082733154, -4.293359756469727, -4.115696907043457, -3.9380338191986084, -3.760370969772339, -3.5827078819274902, -3.4050450325012207, -3.227382183074951, -3.0497193336486816, -2.872056484222412, -2.6943936347961426, -2.516730546951294, -2.3390676975250244, -2.161404609680176, -1.9837417602539062, -1.8060789108276367, -1.6284159421920776, -1.4507529735565186, -1.2730900049209595, -1.0954270362854004, -0.9177641868591309, -0.7401012182235718, -0.5624382495880127, -0.38477540016174316, -0.20711243152618408, -0.029449939727783203, 0.1482129991054535, 0.3258759379386902, 0.5035388469696045, 0.6812018156051636, 0.8588647842407227, 1.0365276336669922, 1.2141906023025513, 1.3918535709381104, 1.5695165395736694, 1.7471795082092285, 1.924842357635498, 2.1025052070617676, 2.280168294906616, 2.4578311443328857, 2.6354942321777344, 2.813157081604004, 2.9908199310302734, 3.168483018875122, 3.3461458683013916, 3.5238089561462402, 3.7014718055725098, 3.8791346549987793, 4.056797504425049, 4.234460830688477, 4.412123680114746, 4.589786529541016, 4.767449378967285, 4.945112705230713, 5.122775554656982, 5.300438404083252, 5.4781012535095215, 5.655764102935791]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 11.0, 14.0, 18.0, 18.0, 19.0, 30.0, 29.0, 53.0, 35.0, 59.0, 56.0, 58.0, 75.0, 55.0, 63.0, 62.0, 42.0, 53.0, 35.0, 23.0, 33.0, 32.0, 12.0, 10.0, 19.0, 13.0, 11.0, 10.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7983930110931396, -3.6759300231933594, -3.553467035293579, -3.431004047393799, -3.3085408210754395, -3.1860780715942383, -3.063614845275879, -2.9411518573760986, -2.8186888694763184, -2.696225881576538, -2.573762893676758, -2.4512999057769775, -2.3288369178771973, -2.206373691558838, -2.0839107036590576, -1.9614477157592773, -1.838984727859497, -1.7165217399597168, -1.5940587520599365, -1.4715956449508667, -1.3491326570510864, -1.2266696691513062, -1.1042065620422363, -0.981743574142456, -0.8592805862426758, -0.7368175983428955, -0.6143545508384705, -0.4918915331363678, -0.36942851543426514, -0.24696552753448486, -0.12450248003005981, -0.0020394325256347656, 0.12042379379272461, 0.24288681149482727, 0.36534982919692993, 0.4878128468990326, 0.6102758646011353, 0.7327388525009155, 0.8552019000053406, 0.9776649475097656, 1.100127935409546, 1.2225909233093262, 1.3450539112091064, 1.4675170183181763, 1.5899800062179565, 1.7124429941177368, 1.8349061012268066, 1.957369089126587, 2.079832077026367, 2.2022950649261475, 2.3247580528259277, 2.447221040725708, 2.5696840286254883, 2.6921472549438477, 2.814610242843628, 2.937073230743408, 3.0595362186431885, 3.1819992065429688, 3.304462194442749, 3.4269251823425293, 3.5493884086608887, 3.67185115814209, 3.794314384460449, 3.9167773723602295, 4.03924036026001]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 11.0, 15.0, 19.0, 26.0, 30.0, 48.0, 103.0, 172.0, 373.0, 870.0, 2275.0, 7394.0, 40694.0, 3831087.0, 283635.0, 19770.0, 4768.0, 1621.0, 666.0, 296.0, 145.0, 85.0, 51.0, 34.0, 28.0, 17.0, 12.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.61767578125, -0.6025428771972656, -0.5874099731445312, -0.5722770690917969, -0.5571441650390625, -0.5420112609863281, -0.5268783569335938, -0.5117454528808594, -0.496612548828125, -0.4814796447753906, -0.46634674072265625, -0.4512138366699219, -0.4360809326171875, -0.4209480285644531, -0.40581512451171875, -0.3906822204589844, -0.37554931640625, -0.3604164123535156, -0.34528350830078125, -0.3301506042480469, -0.3150177001953125, -0.2998847961425781, -0.28475189208984375, -0.2696189880371094, -0.254486083984375, -0.23935317993164062, -0.22422027587890625, -0.20908737182617188, -0.1939544677734375, -0.17882156372070312, -0.16368865966796875, -0.14855575561523438, -0.1334228515625, -0.11828994750976562, -0.10315704345703125, -0.08802413940429688, -0.0728912353515625, -0.057758331298828125, -0.04262542724609375, -0.027492523193359375, -0.012359619140625, 0.002773284912109375, 0.01790618896484375, 0.033039093017578125, 0.0481719970703125, 0.06330490112304688, 0.07843780517578125, 0.09357070922851562, 0.10870361328125, 0.12383651733398438, 0.13896942138671875, 0.15410232543945312, 0.1692352294921875, 0.18436813354492188, 0.19950103759765625, 0.21463394165039062, 0.229766845703125, 0.24489974975585938, 0.26003265380859375, 0.2751655578613281, 0.2902984619140625, 0.3054313659667969, 0.32056427001953125, 0.3356971740722656, 0.350830078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 10.0, 20.0, 19.0, 28.0, 31.0, 57.0, 61.0, 65.0, 85.0, 89.0, 84.0, 97.0, 66.0, 47.0, 54.0, 49.0, 26.0, 27.0, 17.0, 16.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.18270111083984375, -0.1759490966796875, -0.16919708251953125, -0.162445068359375, -0.15569305419921875, -0.1489410400390625, -0.14218902587890625, -0.13543701171875, -0.12868499755859375, -0.1219329833984375, -0.11518096923828125, -0.108428955078125, -0.10167694091796875, -0.0949249267578125, -0.08817291259765625, -0.0814208984375, -0.07466888427734375, -0.0679168701171875, -0.06116485595703125, -0.054412841796875, -0.04766082763671875, -0.0409088134765625, -0.03415679931640625, -0.02740478515625, -0.02065277099609375, -0.0139007568359375, -0.00714874267578125, -0.000396728515625, 0.00635528564453125, 0.0131072998046875, 0.01985931396484375, 0.026611328125, 0.03336334228515625, 0.0401153564453125, 0.04686737060546875, 0.053619384765625, 0.06037139892578125, 0.0671234130859375, 0.07387542724609375, 0.08062744140625, 0.08737945556640625, 0.0941314697265625, 0.10088348388671875, 0.107635498046875, 0.11438751220703125, 0.1211395263671875, 0.12789154052734375, 0.1346435546875, 0.14139556884765625, 0.1481475830078125, 0.15489959716796875, 0.161651611328125, 0.16840362548828125, 0.1751556396484375, 0.18190765380859375, 0.18865966796875, 0.19541168212890625, 0.2021636962890625, 0.20891571044921875, 0.215667724609375, 0.22241973876953125, 0.2291717529296875, 0.23592376708984375, 0.24267578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 11.0, 15.0, 20.0, 38.0, 50.0, 74.0, 126.0, 142.0, 278.0, 478.0, 899.0, 1875.0, 4630.0, 15585.0, 105456.0, 3853984.0, 179843.0, 20549.0, 5602.0, 2224.0, 996.0, 536.0, 291.0, 177.0, 127.0, 85.0, 48.0, 42.0, 24.0, 19.0, 11.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3851165771484375, -0.372528076171875, -0.3599395751953125, -0.34735107421875, -0.3347625732421875, -0.322174072265625, -0.3095855712890625, -0.2969970703125, -0.2844085693359375, -0.271820068359375, -0.2592315673828125, -0.24664306640625, -0.2340545654296875, -0.221466064453125, -0.2088775634765625, -0.1962890625, -0.1837005615234375, -0.171112060546875, -0.1585235595703125, -0.14593505859375, -0.1333465576171875, -0.120758056640625, -0.1081695556640625, -0.0955810546875, -0.0829925537109375, -0.070404052734375, -0.0578155517578125, -0.04522705078125, -0.0326385498046875, -0.020050048828125, -0.0074615478515625, 0.005126953125, 0.0177154541015625, 0.030303955078125, 0.0428924560546875, 0.05548095703125, 0.0680694580078125, 0.080657958984375, 0.0932464599609375, 0.1058349609375, 0.1184234619140625, 0.131011962890625, 0.1436004638671875, 0.15618896484375, 0.1687774658203125, 0.181365966796875, 0.1939544677734375, 0.20654296875, 0.2191314697265625, 0.231719970703125, 0.2443084716796875, 0.25689697265625, 0.2694854736328125, 0.282073974609375, 0.2946624755859375, 0.3072509765625, 0.3198394775390625, 0.332427978515625, 0.3450164794921875, 0.35760498046875, 0.3701934814453125, 0.382781982421875, 0.3953704833984375, 0.407958984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 12.0, 15.0, 21.0, 49.0, 135.0, 489.0, 2912.0, 253.0, 96.0, 32.0, 21.0, 15.0, 6.0, 5.0, 0.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.1563262939453125, -0.151641845703125, -0.1469573974609375, -0.14227294921875, -0.1375885009765625, -0.132904052734375, -0.1282196044921875, -0.12353515625, -0.1188507080078125, -0.114166259765625, -0.1094818115234375, -0.10479736328125, -0.1001129150390625, -0.095428466796875, -0.0907440185546875, -0.0860595703125, -0.0813751220703125, -0.076690673828125, -0.0720062255859375, -0.06732177734375, -0.0626373291015625, -0.057952880859375, -0.0532684326171875, -0.048583984375, -0.0438995361328125, -0.039215087890625, -0.0345306396484375, -0.02984619140625, -0.0251617431640625, -0.020477294921875, -0.0157928466796875, -0.0111083984375, -0.0064239501953125, -0.001739501953125, 0.0029449462890625, 0.00762939453125, 0.0123138427734375, 0.016998291015625, 0.0216827392578125, 0.0263671875, 0.0310516357421875, 0.035736083984375, 0.0404205322265625, 0.04510498046875, 0.0497894287109375, 0.054473876953125, 0.0591583251953125, 0.0638427734375, 0.0685272216796875, 0.073211669921875, 0.0778961181640625, 0.08258056640625, 0.0872650146484375, 0.091949462890625, 0.0966339111328125, 0.101318359375, 0.1060028076171875, 0.110687255859375, 0.1153717041015625, 0.12005615234375, 0.1247406005859375, 0.129425048828125, 0.1341094970703125, 0.1387939453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 18.0, 29.0, 64.0, 105.0, 148.0, 196.0, 170.0, 137.0, 71.0, 44.0, 12.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.9417344331741333, -0.923327624797821, -0.9049208164215088, -0.8865140676498413, -0.868107259273529, -0.8497004508972168, -0.8312937021255493, -0.8128868937492371, -0.7944800853729248, -0.7760732769966125, -0.7576664686203003, -0.7392597198486328, -0.7208529114723206, -0.7024461030960083, -0.6840393543243408, -0.6656325459480286, -0.6472257375717163, -0.628818929195404, -0.6104121208190918, -0.5920053720474243, -0.5735985636711121, -0.5551917552947998, -0.5367850065231323, -0.5183781981468201, -0.4999713897705078, -0.48156458139419556, -0.4631578028202057, -0.4447510242462158, -0.42634421586990356, -0.4079374074935913, -0.38953062891960144, -0.3711238503456116, -0.3527171015739441, -0.33431029319763184, -0.31590351462364197, -0.2974967360496521, -0.27908992767333984, -0.2606831192970276, -0.24227634072303772, -0.22386954724788666, -0.2054627537727356, -0.18705596029758453, -0.16864916682243347, -0.1502423733472824, -0.13183557987213135, -0.11342878639698029, -0.09502199292182922, -0.07661519944667816, -0.0582084059715271, -0.03980161249637604, -0.021394819021224976, -0.0029880255460739136, 0.015418767929077148, 0.03382556140422821, 0.05223235487937927, 0.07063914835453033, 0.0890459418296814, 0.10745273530483246, 0.12585952877998352, 0.14426632225513458, 0.16267311573028564, 0.1810799092054367, 0.19948670268058777, 0.21789349615573883, 0.2363002896308899]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 8.0, 8.0, 17.0, 12.0, 11.0, 10.0, 20.0, 18.0, 20.0, 24.0, 32.0, 27.0, 41.0, 43.0, 34.0, 37.0, 47.0, 51.0, 35.0, 44.0, 47.0, 46.0, 37.0, 41.0, 27.0, 25.0, 35.0, 32.0, 19.0, 26.0, 25.0, 20.0, 19.0, 11.0, 16.0, 7.0, 4.0, 9.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.23878049850463867, -0.2317516803741455, -0.22472284734249115, -0.2176940143108368, -0.21066519618034363, -0.20363637804985046, -0.1966075450181961, -0.18957871198654175, -0.18254989385604858, -0.17552107572555542, -0.16849224269390106, -0.1614634096622467, -0.15443459153175354, -0.14740577340126038, -0.14037694036960602, -0.13334810733795166, -0.1263192892074585, -0.11929046362638474, -0.11226163804531097, -0.10523281246423721, -0.09820398688316345, -0.09117516130208969, -0.08414633572101593, -0.07711751013994217, -0.07008868455886841, -0.06305985897779465, -0.056031033396720886, -0.049002207815647125, -0.041973382234573364, -0.0349445566534996, -0.027915731072425842, -0.02088690549135208, -0.01385807991027832, -0.006829254329204559, 0.00019957125186920166, 0.007228396832942963, 0.014257222414016724, 0.021286047995090485, 0.028314873576164246, 0.03534369915723801, 0.04237252473831177, 0.04940135031938553, 0.05643017590045929, 0.06345900148153305, 0.07048782706260681, 0.07751665264368057, 0.08454547822475433, 0.0915743038058281, 0.09860312938690186, 0.10563195496797562, 0.11266078054904938, 0.11968960613012314, 0.1267184317111969, 0.13374724984169006, 0.14077608287334442, 0.14780491590499878, 0.15483373403549194, 0.1618625521659851, 0.16889138519763947, 0.17592021822929382, 0.182949036359787, 0.18997785449028015, 0.1970066875219345, 0.20403552055358887, 0.21106433868408203]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 17.0, 17.0, 27.0, 36.0, 101.0, 139.0, 281.0, 544.0, 1100.0, 3105.0, 9596.0, 39409.0, 204935.0, 538578.0, 197740.0, 38295.0, 9313.0, 2995.0, 1163.0, 520.0, 269.0, 144.0, 85.0, 55.0, 26.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41015625, -0.3992156982421875, -0.388275146484375, -0.3773345947265625, -0.36639404296875, -0.3554534912109375, -0.344512939453125, -0.3335723876953125, -0.3226318359375, -0.3116912841796875, -0.300750732421875, -0.2898101806640625, -0.27886962890625, -0.2679290771484375, -0.256988525390625, -0.2460479736328125, -0.235107421875, -0.2241668701171875, -0.213226318359375, -0.2022857666015625, -0.19134521484375, -0.1804046630859375, -0.169464111328125, -0.1585235595703125, -0.1475830078125, -0.1366424560546875, -0.125701904296875, -0.1147613525390625, -0.10382080078125, -0.0928802490234375, -0.081939697265625, -0.0709991455078125, -0.06005859375, -0.0491180419921875, -0.038177490234375, -0.0272369384765625, -0.01629638671875, -0.0053558349609375, 0.005584716796875, 0.0165252685546875, 0.0274658203125, 0.0384063720703125, 0.049346923828125, 0.0602874755859375, 0.07122802734375, 0.0821685791015625, 0.093109130859375, 0.1040496826171875, 0.114990234375, 0.1259307861328125, 0.136871337890625, 0.1478118896484375, 0.15875244140625, 0.1696929931640625, 0.180633544921875, 0.1915740966796875, 0.2025146484375, 0.2134552001953125, 0.224395751953125, 0.2353363037109375, 0.24627685546875, 0.2572174072265625, 0.268157958984375, 0.2790985107421875, 0.2900390625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 8.0, 9.0, 18.0, 19.0, 18.0, 20.0, 37.0, 39.0, 62.0, 66.0, 66.0, 72.0, 83.0, 94.0, 78.0, 58.0, 53.0, 41.0, 39.0, 42.0, 17.0, 18.0, 10.0, 6.0, 6.0, 8.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18257522583007812, -0.17618560791015625, -0.16979598999023438, -0.1634063720703125, -0.15701675415039062, -0.15062713623046875, -0.14423751831054688, -0.137847900390625, -0.13145828247070312, -0.12506866455078125, -0.11867904663085938, -0.1122894287109375, -0.10589981079101562, -0.09951019287109375, -0.09312057495117188, -0.08673095703125, -0.08034133911132812, -0.07395172119140625, -0.06756210327148438, -0.0611724853515625, -0.054782867431640625, -0.04839324951171875, -0.042003631591796875, -0.035614013671875, -0.029224395751953125, -0.02283477783203125, -0.016445159912109375, -0.0100555419921875, -0.003665924072265625, 0.00272369384765625, 0.009113311767578125, 0.0155029296875, 0.021892547607421875, 0.02828216552734375, 0.034671783447265625, 0.0410614013671875, 0.047451019287109375, 0.05384063720703125, 0.060230255126953125, 0.066619873046875, 0.07300949096679688, 0.07939910888671875, 0.08578872680664062, 0.0921783447265625, 0.09856796264648438, 0.10495758056640625, 0.11134719848632812, 0.11773681640625, 0.12412643432617188, 0.13051605224609375, 0.13690567016601562, 0.1432952880859375, 0.14968490600585938, 0.15607452392578125, 0.16246414184570312, 0.168853759765625, 0.17524337768554688, 0.18163299560546875, 0.18802261352539062, 0.1944122314453125, 0.20080184936523438, 0.20719146728515625, 0.21358108520507812, 0.219970703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 8.0, 5.0, 5.0, 6.0, 13.0, 9.0, 19.0, 37.0, 60.0, 90.0, 179.0, 491.0, 1630.0, 10121.0, 322327.0, 693195.0, 17001.0, 2233.0, 592.0, 238.0, 104.0, 67.0, 38.0, 23.0, 11.0, 12.0, 2.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6201171875, -0.594390869140625, -0.56866455078125, -0.542938232421875, -0.5172119140625, -0.491485595703125, -0.46575927734375, -0.440032958984375, -0.414306640625, -0.388580322265625, -0.36285400390625, -0.337127685546875, -0.3114013671875, -0.285675048828125, -0.25994873046875, -0.234222412109375, -0.20849609375, -0.182769775390625, -0.15704345703125, -0.131317138671875, -0.1055908203125, -0.079864501953125, -0.05413818359375, -0.028411865234375, -0.002685546875, 0.023040771484375, 0.04876708984375, 0.074493408203125, 0.1002197265625, 0.125946044921875, 0.15167236328125, 0.177398681640625, 0.203125, 0.228851318359375, 0.25457763671875, 0.280303955078125, 0.3060302734375, 0.331756591796875, 0.35748291015625, 0.383209228515625, 0.408935546875, 0.434661865234375, 0.46038818359375, 0.486114501953125, 0.5118408203125, 0.537567138671875, 0.56329345703125, 0.589019775390625, 0.61474609375, 0.640472412109375, 0.66619873046875, 0.691925048828125, 0.7176513671875, 0.743377685546875, 0.76910400390625, 0.794830322265625, 0.820556640625, 0.846282958984375, 0.87200927734375, 0.897735595703125, 0.9234619140625, 0.949188232421875, 0.97491455078125, 1.000640869140625, 1.0263671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 9.0, 4.0, 4.0, 5.0, 8.0, 10.0, 11.0, 13.0, 14.0, 17.0, 24.0, 38.0, 30.0, 40.0, 33.0, 51.0, 60.0, 62.0, 54.0, 56.0, 52.0, 78.0, 59.0, 42.0, 35.0, 28.0, 28.0, 21.0, 24.0, 14.0, 9.0, 13.0, 8.0, 6.0, 4.0, 5.0, 2.0, 7.0, 6.0, 0.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.68896484375, -0.6676483154296875, -0.646331787109375, -0.6250152587890625, -0.60369873046875, -0.5823822021484375, -0.561065673828125, -0.5397491455078125, -0.5184326171875, -0.4971160888671875, -0.475799560546875, -0.4544830322265625, -0.43316650390625, -0.4118499755859375, -0.390533447265625, -0.3692169189453125, -0.347900390625, -0.3265838623046875, -0.305267333984375, -0.2839508056640625, -0.26263427734375, -0.2413177490234375, -0.220001220703125, -0.1986846923828125, -0.1773681640625, -0.1560516357421875, -0.134735107421875, -0.1134185791015625, -0.09210205078125, -0.0707855224609375, -0.049468994140625, -0.0281524658203125, -0.0068359375, 0.0144805908203125, 0.035797119140625, 0.0571136474609375, 0.07843017578125, 0.0997467041015625, 0.121063232421875, 0.1423797607421875, 0.1636962890625, 0.1850128173828125, 0.206329345703125, 0.2276458740234375, 0.24896240234375, 0.2702789306640625, 0.291595458984375, 0.3129119873046875, 0.334228515625, 0.3555450439453125, 0.376861572265625, 0.3981781005859375, 0.41949462890625, 0.4408111572265625, 0.462127685546875, 0.4834442138671875, 0.5047607421875, 0.5260772705078125, 0.547393798828125, 0.5687103271484375, 0.59002685546875, 0.6113433837890625, 0.632659912109375, 0.6539764404296875, 0.67529296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 20.0, 25.0, 35.0, 90.0, 178.0, 545.0, 2436.0, 53290.0, 969434.0, 20081.0, 1635.0, 416.0, 166.0, 70.0, 41.0, 32.0, 22.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6067543029785156, -0.5909500122070312, -0.5751457214355469, -0.5593414306640625, -0.5435371398925781, -0.5277328491210938, -0.5119285583496094, -0.496124267578125, -0.4803199768066406, -0.46451568603515625, -0.4487113952636719, -0.4329071044921875, -0.4171028137207031, -0.40129852294921875, -0.3854942321777344, -0.36968994140625, -0.3538856506347656, -0.33808135986328125, -0.3222770690917969, -0.3064727783203125, -0.2906684875488281, -0.27486419677734375, -0.2590599060058594, -0.243255615234375, -0.22745132446289062, -0.21164703369140625, -0.19584274291992188, -0.1800384521484375, -0.16423416137695312, -0.14842987060546875, -0.13262557983398438, -0.1168212890625, -0.10101699829101562, -0.08521270751953125, -0.06940841674804688, -0.0536041259765625, -0.037799835205078125, -0.02199554443359375, -0.006191253662109375, 0.009613037109375, 0.025417327880859375, 0.04122161865234375, 0.057025909423828125, 0.0728302001953125, 0.08863449096679688, 0.10443878173828125, 0.12024307250976562, 0.13604736328125, 0.15185165405273438, 0.16765594482421875, 0.18346023559570312, 0.1992645263671875, 0.21506881713867188, 0.23087310791015625, 0.24667739868164062, 0.262481689453125, 0.2782859802246094, 0.29409027099609375, 0.3098945617675781, 0.3256988525390625, 0.3415031433105469, 0.35730743408203125, 0.3731117248535156, 0.388916015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 12.0, 22.0, 17.0, 32.0, 28.0, 53.0, 74.0, 78.0, 114.0, 131.0, 113.0, 72.0, 60.0, 61.0, 37.0, 31.0, 21.0, 15.0, 10.0, 11.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010263919830322266, -0.0001000305637717247, -9.742192924022675e-05, -9.481329470872879e-05, -9.220466017723083e-05, -8.959602564573288e-05, -8.698739111423492e-05, -8.437875658273697e-05, -8.177012205123901e-05, -7.916148751974106e-05, -7.65528529882431e-05, -7.394421845674515e-05, -7.133558392524719e-05, -6.872694939374924e-05, -6.611831486225128e-05, -6.350968033075333e-05, -6.090104579925537e-05, -5.8292411267757416e-05, -5.568377673625946e-05, -5.3075142204761505e-05, -5.046650767326355e-05, -4.7857873141765594e-05, -4.524923861026764e-05, -4.2640604078769684e-05, -4.003196954727173e-05, -3.742333501577377e-05, -3.481470048427582e-05, -3.220606595277786e-05, -2.9597431421279907e-05, -2.6988796889781952e-05, -2.4380162358283997e-05, -2.177152782678604e-05, -1.9162893295288086e-05, -1.655425876379013e-05, -1.3945624232292175e-05, -1.133698970079422e-05, -8.728355169296265e-06, -6.119720637798309e-06, -3.511086106300354e-06, -9.024515748023987e-07, 1.7061829566955566e-06, 4.314817488193512e-06, 6.923452019691467e-06, 9.532086551189423e-06, 1.2140721082687378e-05, 1.4749355614185333e-05, 1.735799014568329e-05, 1.9966624677181244e-05, 2.25752592086792e-05, 2.5183893740177155e-05, 2.779252827167511e-05, 3.0401162803173065e-05, 3.300979733467102e-05, 3.5618431866168976e-05, 3.822706639766693e-05, 4.0835700929164886e-05, 4.344433546066284e-05, 4.60529699921608e-05, 4.866160452365875e-05, 5.127023905515671e-05, 5.387887358665466e-05, 5.648750811815262e-05, 5.9096142649650574e-05, 6.170477718114853e-05, 6.431341171264648e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 12.0, 22.0, 30.0, 60.0, 122.0, 224.0, 490.0, 1569.0, 6826.0, 113582.0, 860452.0, 58036.0, 4946.0, 1293.0, 458.0, 192.0, 81.0, 55.0, 35.0, 13.0, 18.0, 8.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2864036560058594, -0.27666473388671875, -0.2669258117675781, -0.2571868896484375, -0.24744796752929688, -0.23770904541015625, -0.22797012329101562, -0.218231201171875, -0.20849227905273438, -0.19875335693359375, -0.18901443481445312, -0.1792755126953125, -0.16953659057617188, -0.15979766845703125, -0.15005874633789062, -0.14031982421875, -0.13058090209960938, -0.12084197998046875, -0.11110305786132812, -0.1013641357421875, -0.09162521362304688, -0.08188629150390625, -0.07214736938476562, -0.062408447265625, -0.052669525146484375, -0.04293060302734375, -0.033191680908203125, -0.0234527587890625, -0.013713836669921875, -0.00397491455078125, 0.005764007568359375, 0.0155029296875, 0.025241851806640625, 0.03498077392578125, 0.044719696044921875, 0.0544586181640625, 0.06419754028320312, 0.07393646240234375, 0.08367538452148438, 0.093414306640625, 0.10315322875976562, 0.11289215087890625, 0.12263107299804688, 0.1323699951171875, 0.14210891723632812, 0.15184783935546875, 0.16158676147460938, 0.17132568359375, 0.18106460571289062, 0.19080352783203125, 0.20054244995117188, 0.2102813720703125, 0.22002029418945312, 0.22975921630859375, 0.23949813842773438, 0.249237060546875, 0.2589759826660156, 0.26871490478515625, 0.2784538269042969, 0.2881927490234375, 0.2979316711425781, 0.30767059326171875, 0.3174095153808594, 0.3271484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 7.0, 1.0, 4.0, 10.0, 11.0, 24.0, 36.0, 52.0, 73.0, 93.0, 116.0, 121.0, 118.0, 92.0, 77.0, 63.0, 35.0, 20.0, 21.0, 4.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.23842430114746094, -0.23014450073242188, -0.2218647003173828, -0.21358489990234375, -0.2053050994873047, -0.19702529907226562, -0.18874549865722656, -0.1804656982421875, -0.17218589782714844, -0.16390609741210938, -0.1556262969970703, -0.14734649658203125, -0.1390666961669922, -0.13078689575195312, -0.12250709533691406, -0.114227294921875, -0.10594749450683594, -0.09766769409179688, -0.08938789367675781, -0.08110809326171875, -0.07282829284667969, -0.06454849243164062, -0.05626869201660156, -0.0479888916015625, -0.03970909118652344, -0.031429290771484375, -0.023149490356445312, -0.01486968994140625, -0.0065898895263671875, 0.001689910888671875, 0.009969711303710938, 0.01824951171875, 0.026529312133789062, 0.034809112548828125, 0.04308891296386719, 0.05136871337890625, 0.05964851379394531, 0.06792831420898438, 0.07620811462402344, 0.0844879150390625, 0.09276771545410156, 0.10104751586914062, 0.10932731628417969, 0.11760711669921875, 0.1258869171142578, 0.13416671752929688, 0.14244651794433594, 0.150726318359375, 0.15900611877441406, 0.16728591918945312, 0.1755657196044922, 0.18384552001953125, 0.1921253204345703, 0.20040512084960938, 0.20868492126464844, 0.2169647216796875, 0.22524452209472656, 0.23352432250976562, 0.2418041229248047, 0.25008392333984375, 0.2583637237548828, 0.2666435241699219, 0.27492332458496094, 0.283203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 11.0, 14.0, 30.0, 47.0, 82.0, 119.0, 170.0, 174.0, 139.0, 93.0, 60.0, 25.0, 13.0, 13.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.522227764129639, -5.412898540496826, -5.3035688400268555, -5.194239616394043, -5.084909915924072, -4.97558069229126, -4.866250991821289, -4.756921768188477, -4.647592544555664, -4.538263320922852, -4.428933620452881, -4.319604396820068, -4.210274696350098, -4.100945472717285, -3.9916160106658936, -3.882286548614502, -3.7729570865631104, -3.6636276245117188, -3.554298162460327, -3.4449687004089355, -3.335639476776123, -3.2263100147247314, -3.11698055267334, -3.0076510906219482, -2.8983216285705566, -2.788992166519165, -2.6796627044677734, -2.570333480834961, -2.4610040187835693, -2.3516745567321777, -2.242345094680786, -2.1330156326293945, -2.023686170578003, -1.9143567085266113, -1.8050273656845093, -1.6956979036331177, -1.5863685607910156, -1.477039098739624, -1.3677096366882324, -1.2583801746368408, -1.1490508317947388, -1.0397213697433472, -0.9303920269012451, -0.8210625648498535, -0.7117331624031067, -0.6024037599563599, -0.49307429790496826, -0.38374489545822144, -0.2744154930114746, -0.1650860756635666, -0.05575665831565857, 0.053572773933410645, 0.16290217638015747, 0.2722315788269043, 0.3815610408782959, 0.4908904433250427, 0.6002198457717896, 0.7095492482185364, 0.8188786506652832, 0.9282081127166748, 1.0375375747680664, 1.1468669176101685, 1.25619637966156, 1.365525722503662, 1.4748551845550537]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 6.0, 15.0, 12.0, 13.0, 19.0, 15.0, 26.0, 29.0, 34.0, 40.0, 38.0, 51.0, 43.0, 59.0, 50.0, 54.0, 52.0, 48.0, 50.0, 42.0, 37.0, 36.0, 42.0, 36.0, 28.0, 23.0, 16.0, 10.0, 8.0, 8.0, 10.0, 8.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5343985557556152, -2.4423270225524902, -2.3502554893493652, -2.2581839561462402, -2.1661124229431152, -2.0740408897399902, -1.9819693565368652, -1.8898978233337402, -1.7978262901306152, -1.7057547569274902, -1.6136832237243652, -1.5216116905212402, -1.4295401573181152, -1.3374686241149902, -1.2453970909118652, -1.1533255577087402, -1.0612541437149048, -0.9691826105117798, -0.8771110773086548, -0.7850395441055298, -0.6929680109024048, -0.6008964776992798, -0.5088250041007996, -0.41675347089767456, -0.32468193769454956, -0.23261040449142456, -0.14053888618946075, -0.04846736788749695, 0.04360416531562805, 0.13567569851875305, 0.22774720191955566, 0.31981873512268066, 0.41189026832580566, 0.5039618015289307, 0.5960333347320557, 0.6881048679351807, 0.7801764011383057, 0.8722479343414307, 0.9643194079399109, 1.0563910007476807, 1.1484625339508057, 1.2405340671539307, 1.3326056003570557, 1.4246771335601807, 1.5167486667633057, 1.6088201999664307, 1.7008917331695557, 1.7929632663726807, 1.8850346803665161, 1.9771062135696411, 2.0691776275634766, 2.1612491607666016, 2.2533206939697266, 2.3453922271728516, 2.4374637603759766, 2.5295352935791016, 2.6216068267822266, 2.7136783599853516, 2.8057498931884766, 2.8978214263916016, 2.9898929595947266, 3.0819644927978516, 3.1740360260009766, 3.2661075592041016, 3.3581790924072266]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 12.0, 9.0, 16.0, 32.0, 37.0, 83.0, 180.0, 337.0, 853.0, 3465.0, 30389.0, 4111215.0, 41693.0, 4079.0, 1059.0, 430.0, 177.0, 95.0, 43.0, 31.0, 19.0, 10.0, 7.0, 4.0, 9.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6277236938476562, -0.6040802001953125, -0.5804367065429688, -0.556793212890625, -0.5331497192382812, -0.5095062255859375, -0.48586273193359375, -0.46221923828125, -0.43857574462890625, -0.4149322509765625, -0.39128875732421875, -0.367645263671875, -0.34400177001953125, -0.3203582763671875, -0.29671478271484375, -0.2730712890625, -0.24942779541015625, -0.2257843017578125, -0.20214080810546875, -0.178497314453125, -0.15485382080078125, -0.1312103271484375, -0.10756683349609375, -0.08392333984375, -0.06027984619140625, -0.0366363525390625, -0.01299285888671875, 0.010650634765625, 0.03429412841796875, 0.0579376220703125, 0.08158111572265625, 0.105224609375, 0.12886810302734375, 0.1525115966796875, 0.17615509033203125, 0.199798583984375, 0.22344207763671875, 0.2470855712890625, 0.27072906494140625, 0.29437255859375, 0.31801605224609375, 0.3416595458984375, 0.36530303955078125, 0.388946533203125, 0.41259002685546875, 0.4362335205078125, 0.45987701416015625, 0.4835205078125, 0.5071640014648438, 0.5308074951171875, 0.5544509887695312, 0.578094482421875, 0.6017379760742188, 0.6253814697265625, 0.6490249633789062, 0.67266845703125, 0.6963119506835938, 0.7199554443359375, 0.7435989379882812, 0.767242431640625, 0.7908859252929688, 0.8145294189453125, 0.8381729125976562, 0.86181640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 17.0, 19.0, 28.0, 41.0, 64.0, 76.0, 83.0, 101.0, 105.0, 104.0, 77.0, 78.0, 55.0, 35.0, 34.0, 20.0, 15.0, 16.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17220115661621094, -0.16386032104492188, -0.1555194854736328, -0.14717864990234375, -0.1388378143310547, -0.13049697875976562, -0.12215614318847656, -0.1138153076171875, -0.10547447204589844, -0.09713363647460938, -0.08879280090332031, -0.08045196533203125, -0.07211112976074219, -0.06377029418945312, -0.05542945861816406, -0.047088623046875, -0.03874778747558594, -0.030406951904296875, -0.022066116333007812, -0.01372528076171875, -0.0053844451904296875, 0.002956390380859375, 0.011297225952148438, 0.0196380615234375, 0.027978897094726562, 0.036319732666015625, 0.04466056823730469, 0.05300140380859375, 0.06134223937988281, 0.06968307495117188, 0.07802391052246094, 0.08636474609375, 0.09470558166503906, 0.10304641723632812, 0.11138725280761719, 0.11972808837890625, 0.1280689239501953, 0.13640975952148438, 0.14475059509277344, 0.1530914306640625, 0.16143226623535156, 0.16977310180664062, 0.1781139373779297, 0.18645477294921875, 0.1947956085205078, 0.20313644409179688, 0.21147727966308594, 0.219818115234375, 0.22815895080566406, 0.23649978637695312, 0.2448406219482422, 0.25318145751953125, 0.2615222930908203, 0.2698631286621094, 0.27820396423339844, 0.2865447998046875, 0.29488563537597656, 0.3032264709472656, 0.3115673065185547, 0.31990814208984375, 0.3282489776611328, 0.3365898132324219, 0.34493064880371094, 0.353271484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 10.0, 14.0, 17.0, 41.0, 60.0, 118.0, 157.0, 276.0, 575.0, 948.0, 1875.0, 4273.0, 13271.0, 78377.0, 3869207.0, 192579.0, 21374.0, 5918.0, 2431.0, 1189.0, 671.0, 395.0, 208.0, 130.0, 69.0, 38.0, 16.0, 16.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20318031311035156, -0.19334793090820312, -0.1835155487060547, -0.17368316650390625, -0.1638507843017578, -0.15401840209960938, -0.14418601989746094, -0.1343536376953125, -0.12452125549316406, -0.11468887329101562, -0.10485649108886719, -0.09502410888671875, -0.08519172668457031, -0.07535934448242188, -0.06552696228027344, -0.055694580078125, -0.04586219787597656, -0.036029815673828125, -0.026197433471679688, -0.01636505126953125, -0.0065326690673828125, 0.003299713134765625, 0.013132095336914062, 0.0229644775390625, 0.03279685974121094, 0.042629241943359375, 0.05246162414550781, 0.06229400634765625, 0.07212638854980469, 0.08195877075195312, 0.09179115295410156, 0.10162353515625, 0.11145591735839844, 0.12128829956054688, 0.1311206817626953, 0.14095306396484375, 0.1507854461669922, 0.16061782836914062, 0.17045021057128906, 0.1802825927734375, 0.19011497497558594, 0.19994735717773438, 0.2097797393798828, 0.21961212158203125, 0.2294445037841797, 0.23927688598632812, 0.24910926818847656, 0.258941650390625, 0.26877403259277344, 0.2786064147949219, 0.2884387969970703, 0.29827117919921875, 0.3081035614013672, 0.3179359436035156, 0.32776832580566406, 0.3376007080078125, 0.34743309020996094, 0.3572654724121094, 0.3670978546142578, 0.37693023681640625, 0.3867626190185547, 0.3965950012207031, 0.40642738342285156, 0.416259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 15.0, 34.0, 53.0, 130.0, 435.0, 2986.0, 239.0, 75.0, 41.0, 23.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07293701171875, -0.06980037689208984, -0.06666374206542969, -0.06352710723876953, -0.060390472412109375, -0.05725383758544922, -0.05411720275878906, -0.050980567932128906, -0.04784393310546875, -0.044707298278808594, -0.04157066345214844, -0.03843402862548828, -0.035297393798828125, -0.03216075897216797, -0.029024124145507812, -0.025887489318847656, -0.0227508544921875, -0.019614219665527344, -0.016477584838867188, -0.013340950012207031, -0.010204315185546875, -0.007067680358886719, -0.0039310455322265625, -0.0007944107055664062, 0.00234222412109375, 0.005478858947753906, 0.008615493774414062, 0.011752128601074219, 0.014888763427734375, 0.01802539825439453, 0.021162033081054688, 0.024298667907714844, 0.027435302734375, 0.030571937561035156, 0.03370857238769531, 0.03684520721435547, 0.039981842041015625, 0.04311847686767578, 0.04625511169433594, 0.049391746520996094, 0.05252838134765625, 0.055665016174316406, 0.05880165100097656, 0.06193828582763672, 0.06507492065429688, 0.06821155548095703, 0.07134819030761719, 0.07448482513427734, 0.0776214599609375, 0.08075809478759766, 0.08389472961425781, 0.08703136444091797, 0.09016799926757812, 0.09330463409423828, 0.09644126892089844, 0.0995779037475586, 0.10271453857421875, 0.1058511734008789, 0.10898780822753906, 0.11212444305419922, 0.11526107788085938, 0.11839771270751953, 0.12153434753417969, 0.12467098236083984, 0.1278076171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 9.0, 6.0, 22.0, 26.0, 39.0, 73.0, 92.0, 112.0, 117.0, 96.0, 111.0, 89.0, 61.0, 48.0, 39.0, 19.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.27748343348503113, -0.269666463136673, -0.2618495225906372, -0.25403255224227905, -0.2462155818939209, -0.23839862644672394, -0.23058167099952698, -0.22276470065116882, -0.21494773030281067, -0.2071307748556137, -0.19931380450725555, -0.1914968490600586, -0.18367987871170044, -0.17586292326450348, -0.16804596781730652, -0.16022899746894836, -0.1524120420217514, -0.14459508657455444, -0.1367781162261963, -0.12896116077899933, -0.12114419043064117, -0.11332723498344421, -0.10551027208566666, -0.0976933091878891, -0.08987634629011154, -0.08205938339233398, -0.07424242049455643, -0.06642545759677887, -0.05860849842429161, -0.05079153552651405, -0.042974576354026794, -0.03515761345624924, -0.027340665459632874, -0.019523702561855316, -0.011706741526722908, -0.0038897804915905, 0.0039271824061870575, 0.011744145303964615, 0.019561104476451874, 0.02737806737422943, 0.03519503027200699, 0.043011993169784546, 0.0508289560675621, 0.05864591524004936, 0.06646287441253662, 0.07427984476089478, 0.08209680020809174, 0.0899137631058693, 0.09773072600364685, 0.10554768890142441, 0.11336465179920197, 0.12118160724639893, 0.12899857759475708, 0.13681553304195404, 0.144632488489151, 0.15244945883750916, 0.1602664291858673, 0.16808338463306427, 0.17590035498142242, 0.18371731042861938, 0.19153428077697754, 0.1993512362241745, 0.20716819167137146, 0.21498516201972961, 0.22280211746692657]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 7.0, 4.0, 8.0, 14.0, 12.0, 19.0, 25.0, 22.0, 24.0, 27.0, 38.0, 37.0, 50.0, 47.0, 36.0, 49.0, 50.0, 54.0, 41.0, 49.0, 56.0, 41.0, 44.0, 47.0, 29.0, 30.0, 32.0, 18.0, 25.0, 12.0, 8.0, 6.0, 8.0, 3.0, 8.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.18881118297576904, -0.1834801435470581, -0.17814911901950836, -0.17281809449195862, -0.16748705506324768, -0.16215601563453674, -0.156824991106987, -0.15149396657943726, -0.14616292715072632, -0.14083188772201538, -0.13550086319446564, -0.1301698386669159, -0.12483879923820496, -0.11950776726007462, -0.11417673528194427, -0.10884570330381393, -0.1035146713256836, -0.09818363934755325, -0.09285260736942291, -0.08752157539129257, -0.08219054341316223, -0.07685951143503189, -0.07152847945690155, -0.06619744747877121, -0.06086641550064087, -0.05553538352251053, -0.05020435154438019, -0.04487331956624985, -0.03954228758811951, -0.034211255609989166, -0.028880223631858826, -0.023549191653728485, -0.018218159675598145, -0.012887127697467804, -0.007556095719337463, -0.002225063741207123, 0.0031059682369232178, 0.008437000215053558, 0.013768032193183899, 0.01909906417131424, 0.02443009614944458, 0.02976112812757492, 0.03509216010570526, 0.0404231920838356, 0.04575422406196594, 0.05108525604009628, 0.056416288018226624, 0.061747319996356964, 0.0670783519744873, 0.07240938395261765, 0.07774041593074799, 0.08307144790887833, 0.08840247988700867, 0.09373351186513901, 0.09906454384326935, 0.10439557582139969, 0.10972660779953003, 0.11505763977766037, 0.12038867175579071, 0.12571969628334045, 0.1310507357120514, 0.13638177514076233, 0.14171279966831207, 0.14704382419586182, 0.15237486362457275]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 14.0, 11.0, 22.0, 38.0, 56.0, 98.0, 203.0, 511.0, 1495.0, 7078.0, 72822.0, 755439.0, 193431.0, 13774.0, 2312.0, 679.0, 270.0, 127.0, 72.0, 36.0, 19.0, 11.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.351806640625, -0.3355674743652344, -0.31932830810546875, -0.3030891418457031, -0.2868499755859375, -0.2706108093261719, -0.25437164306640625, -0.23813247680664062, -0.221893310546875, -0.20565414428710938, -0.18941497802734375, -0.17317581176757812, -0.1569366455078125, -0.14069747924804688, -0.12445831298828125, -0.10821914672851562, -0.09197998046875, -0.07574081420898438, -0.05950164794921875, -0.043262481689453125, -0.0270233154296875, -0.010784149169921875, 0.00545501708984375, 0.021694183349609375, 0.037933349609375, 0.054172515869140625, 0.07041168212890625, 0.08665084838867188, 0.1028900146484375, 0.11912918090820312, 0.13536834716796875, 0.15160751342773438, 0.1678466796875, 0.18408584594726562, 0.20032501220703125, 0.21656417846679688, 0.2328033447265625, 0.24904251098632812, 0.26528167724609375, 0.2815208435058594, 0.297760009765625, 0.3139991760253906, 0.33023834228515625, 0.3464775085449219, 0.3627166748046875, 0.3789558410644531, 0.39519500732421875, 0.4114341735839844, 0.42767333984375, 0.4439125061035156, 0.46015167236328125, 0.4763908386230469, 0.4926300048828125, 0.5088691711425781, 0.5251083374023438, 0.5413475036621094, 0.557586669921875, 0.5738258361816406, 0.5900650024414062, 0.6063041687011719, 0.6225433349609375, 0.6387825012207031, 0.6550216674804688, 0.6712608337402344, 0.6875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 10.0, 16.0, 23.0, 28.0, 48.0, 66.0, 105.0, 96.0, 89.0, 95.0, 106.0, 68.0, 79.0, 50.0, 28.0, 29.0, 17.0, 11.0, 11.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17658424377441406, -0.16823196411132812, -0.1598796844482422, -0.15152740478515625, -0.1431751251220703, -0.13482284545898438, -0.12647056579589844, -0.1181182861328125, -0.10976600646972656, -0.10141372680664062, -0.09306144714355469, -0.08470916748046875, -0.07635688781738281, -0.06800460815429688, -0.05965232849121094, -0.051300048828125, -0.04294776916503906, -0.034595489501953125, -0.026243209838867188, -0.01789093017578125, -0.009538650512695312, -0.001186370849609375, 0.0071659088134765625, 0.0155181884765625, 0.023870468139648438, 0.032222747802734375, 0.04057502746582031, 0.04892730712890625, 0.05727958679199219, 0.06563186645507812, 0.07398414611816406, 0.08233642578125, 0.09068870544433594, 0.09904098510742188, 0.10739326477050781, 0.11574554443359375, 0.12409782409667969, 0.13245010375976562, 0.14080238342285156, 0.1491546630859375, 0.15750694274902344, 0.16585922241210938, 0.1742115020751953, 0.18256378173828125, 0.1909160614013672, 0.19926834106445312, 0.20762062072753906, 0.215972900390625, 0.22432518005371094, 0.23267745971679688, 0.2410297393798828, 0.24938201904296875, 0.2577342987060547, 0.2660865783691406, 0.27443885803222656, 0.2827911376953125, 0.29114341735839844, 0.2994956970214844, 0.3078479766845703, 0.31620025634765625, 0.3245525360107422, 0.3329048156738281, 0.34125709533691406, 0.349609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 14.0, 17.0, 29.0, 24.0, 26.0, 42.0, 75.0, 128.0, 227.0, 532.0, 1482.0, 8501.0, 361539.0, 659902.0, 12716.0, 1931.0, 696.0, 242.0, 131.0, 76.0, 62.0, 42.0, 23.0, 20.0, 15.0, 13.0, 7.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6990814208984375, -0.677947998046875, -0.6568145751953125, -0.63568115234375, -0.6145477294921875, -0.593414306640625, -0.5722808837890625, -0.5511474609375, -0.5300140380859375, -0.508880615234375, -0.4877471923828125, -0.46661376953125, -0.4454803466796875, -0.424346923828125, -0.4032135009765625, -0.382080078125, -0.3609466552734375, -0.339813232421875, -0.3186798095703125, -0.29754638671875, -0.2764129638671875, -0.255279541015625, -0.2341461181640625, -0.2130126953125, -0.1918792724609375, -0.170745849609375, -0.1496124267578125, -0.12847900390625, -0.1073455810546875, -0.086212158203125, -0.0650787353515625, -0.0439453125, -0.0228118896484375, -0.001678466796875, 0.0194549560546875, 0.04058837890625, 0.0617218017578125, 0.082855224609375, 0.1039886474609375, 0.1251220703125, 0.1462554931640625, 0.167388916015625, 0.1885223388671875, 0.20965576171875, 0.2307891845703125, 0.251922607421875, 0.2730560302734375, 0.294189453125, 0.3153228759765625, 0.336456298828125, 0.3575897216796875, 0.37872314453125, 0.3998565673828125, 0.420989990234375, 0.4421234130859375, 0.4632568359375, 0.4843902587890625, 0.505523681640625, 0.5266571044921875, 0.54779052734375, 0.5689239501953125, 0.590057373046875, 0.6111907958984375, 0.63232421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 10.0, 10.0, 10.0, 19.0, 14.0, 26.0, 26.0, 21.0, 49.0, 35.0, 35.0, 40.0, 45.0, 44.0, 55.0, 41.0, 47.0, 58.0, 50.0, 33.0, 33.0, 41.0, 32.0, 39.0, 25.0, 26.0, 24.0, 22.0, 13.0, 15.0, 10.0, 10.0, 4.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.65625, -0.6384353637695312, -0.6206207275390625, -0.6028060913085938, -0.584991455078125, -0.5671768188476562, -0.5493621826171875, -0.5315475463867188, -0.51373291015625, -0.49591827392578125, -0.4781036376953125, -0.46028900146484375, -0.442474365234375, -0.42465972900390625, -0.4068450927734375, -0.38903045654296875, -0.3712158203125, -0.35340118408203125, -0.3355865478515625, -0.31777191162109375, -0.299957275390625, -0.28214263916015625, -0.2643280029296875, -0.24651336669921875, -0.22869873046875, -0.21088409423828125, -0.1930694580078125, -0.17525482177734375, -0.157440185546875, -0.13962554931640625, -0.1218109130859375, -0.10399627685546875, -0.086181640625, -0.06836700439453125, -0.0505523681640625, -0.03273773193359375, -0.014923095703125, 0.00289154052734375, 0.0207061767578125, 0.03852081298828125, 0.05633544921875, 0.07415008544921875, 0.0919647216796875, 0.10977935791015625, 0.127593994140625, 0.14540863037109375, 0.1632232666015625, 0.18103790283203125, 0.1988525390625, 0.21666717529296875, 0.2344818115234375, 0.25229644775390625, 0.270111083984375, 0.28792572021484375, 0.3057403564453125, 0.32355499267578125, 0.34136962890625, 0.35918426513671875, 0.3769989013671875, 0.39481353759765625, 0.412628173828125, 0.43044281005859375, 0.4482574462890625, 0.46607208251953125, 0.48388671875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 18.0, 31.0, 87.0, 423.0, 3973.0, 1011478.0, 31275.0, 957.0, 195.0, 54.0, 26.0, 13.0, 7.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.7696304321289062, -0.7492218017578125, -0.7288131713867188, -0.708404541015625, -0.6879959106445312, -0.6675872802734375, -0.6471786499023438, -0.62677001953125, -0.6063613891601562, -0.5859527587890625, -0.5655441284179688, -0.545135498046875, -0.5247268676757812, -0.5043182373046875, -0.48390960693359375, -0.4635009765625, -0.44309234619140625, -0.4226837158203125, -0.40227508544921875, -0.381866455078125, -0.36145782470703125, -0.3410491943359375, -0.32064056396484375, -0.30023193359375, -0.27982330322265625, -0.2594146728515625, -0.23900604248046875, -0.218597412109375, -0.19818878173828125, -0.1777801513671875, -0.15737152099609375, -0.136962890625, -0.11655426025390625, -0.0961456298828125, -0.07573699951171875, -0.055328369140625, -0.03491973876953125, -0.0145111083984375, 0.00589752197265625, 0.02630615234375, 0.04671478271484375, 0.0671234130859375, 0.08753204345703125, 0.107940673828125, 0.12834930419921875, 0.1487579345703125, 0.16916656494140625, 0.1895751953125, 0.20998382568359375, 0.2303924560546875, 0.25080108642578125, 0.271209716796875, 0.29161834716796875, 0.3120269775390625, 0.33243560791015625, 0.35284423828125, 0.37325286865234375, 0.3936614990234375, 0.41407012939453125, 0.434478759765625, 0.45488739013671875, 0.4752960205078125, 0.49570465087890625, 0.51611328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 13.0, 23.0, 13.0, 20.0, 24.0, 16.0, 18.0, 26.0, 39.0, 65.0, 102.0, 68.0, 90.0, 94.0, 84.0, 60.0, 40.0, 53.0, 27.0, 16.0, 18.0, 16.0, 9.0, 7.0, 3.0, 6.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.583597183227539e-05, -4.437938332557678e-05, -4.2922794818878174e-05, -4.1466206312179565e-05, -4.000961780548096e-05, -3.855302929878235e-05, -3.709644079208374e-05, -3.563985228538513e-05, -3.4183263778686523e-05, -3.2726675271987915e-05, -3.127008676528931e-05, -2.9813498258590698e-05, -2.835690975189209e-05, -2.690032124519348e-05, -2.5443732738494873e-05, -2.3987144231796265e-05, -2.2530555725097656e-05, -2.1073967218399048e-05, -1.961737871170044e-05, -1.816079020500183e-05, -1.6704201698303223e-05, -1.5247613191604614e-05, -1.3791024684906006e-05, -1.2334436178207397e-05, -1.0877847671508789e-05, -9.42125916481018e-06, -7.964670658111572e-06, -6.508082151412964e-06, -5.0514936447143555e-06, -3.594905138015747e-06, -2.1383166313171387e-06, -6.817281246185303e-07, 7.748603820800781e-07, 2.2314488887786865e-06, 3.688037395477295e-06, 5.144625902175903e-06, 6.601214408874512e-06, 8.05780291557312e-06, 9.514391422271729e-06, 1.0970979928970337e-05, 1.2427568435668945e-05, 1.3884156942367554e-05, 1.5340745449066162e-05, 1.679733395576477e-05, 1.825392246246338e-05, 1.9710510969161987e-05, 2.1167099475860596e-05, 2.2623687982559204e-05, 2.4080276489257812e-05, 2.553686499595642e-05, 2.699345350265503e-05, 2.8450042009353638e-05, 2.9906630516052246e-05, 3.1363219022750854e-05, 3.281980752944946e-05, 3.427639603614807e-05, 3.573298454284668e-05, 3.718957304954529e-05, 3.8646161556243896e-05, 4.0102750062942505e-05, 4.155933856964111e-05, 4.301592707633972e-05, 4.447251558303833e-05, 4.592910408973694e-05, 4.738569259643555e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 6.0, 13.0, 33.0, 56.0, 172.0, 514.0, 2456.0, 59857.0, 965500.0, 17770.0, 1538.0, 388.0, 111.0, 47.0, 26.0, 13.0, 16.0, 4.0, 4.0, 4.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5288200378417969, -0.5166244506835938, -0.5044288635253906, -0.4922332763671875, -0.4800376892089844, -0.46784210205078125, -0.4556465148925781, -0.443450927734375, -0.4312553405761719, -0.41905975341796875, -0.4068641662597656, -0.3946685791015625, -0.3824729919433594, -0.37027740478515625, -0.3580818176269531, -0.34588623046875, -0.3336906433105469, -0.32149505615234375, -0.3092994689941406, -0.2971038818359375, -0.2849082946777344, -0.27271270751953125, -0.2605171203613281, -0.248321533203125, -0.23612594604492188, -0.22393035888671875, -0.21173477172851562, -0.1995391845703125, -0.18734359741210938, -0.17514801025390625, -0.16295242309570312, -0.1507568359375, -0.13856124877929688, -0.12636566162109375, -0.11417007446289062, -0.1019744873046875, -0.08977890014648438, -0.07758331298828125, -0.06538772583007812, -0.053192138671875, -0.040996551513671875, -0.02880096435546875, -0.016605377197265625, -0.0044097900390625, 0.007785797119140625, 0.01998138427734375, 0.032176971435546875, 0.04437255859375, 0.056568145751953125, 0.06876373291015625, 0.08095932006835938, 0.0931549072265625, 0.10535049438476562, 0.11754608154296875, 0.12974166870117188, 0.141937255859375, 0.15413284301757812, 0.16632843017578125, 0.17852401733398438, 0.1907196044921875, 0.20291519165039062, 0.21511077880859375, 0.22730636596679688, 0.239501953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 3.0, 6.0, 5.0, 13.0, 28.0, 40.0, 73.0, 99.0, 112.0, 137.0, 136.0, 108.0, 99.0, 53.0, 33.0, 18.0, 12.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2695655822753906, -0.26203155517578125, -0.2544975280761719, -0.2469635009765625, -0.23942947387695312, -0.23189544677734375, -0.22436141967773438, -0.216827392578125, -0.20929336547851562, -0.20175933837890625, -0.19422531127929688, -0.1866912841796875, -0.17915725708007812, -0.17162322998046875, -0.16408920288085938, -0.15655517578125, -0.14902114868164062, -0.14148712158203125, -0.13395309448242188, -0.1264190673828125, -0.11888504028320312, -0.11135101318359375, -0.10381698608398438, -0.096282958984375, -0.08874893188476562, -0.08121490478515625, -0.07368087768554688, -0.0661468505859375, -0.058612823486328125, -0.05107879638671875, -0.043544769287109375, -0.0360107421875, -0.028476715087890625, -0.02094268798828125, -0.013408660888671875, -0.0058746337890625, 0.001659393310546875, 0.00919342041015625, 0.016727447509765625, 0.024261474609375, 0.031795501708984375, 0.03932952880859375, 0.046863555908203125, 0.0543975830078125, 0.061931610107421875, 0.06946563720703125, 0.07699966430664062, 0.08453369140625, 0.09206771850585938, 0.09960174560546875, 0.10713577270507812, 0.1146697998046875, 0.12220382690429688, 0.12973785400390625, 0.13727188110351562, 0.144805908203125, 0.15233993530273438, 0.15987396240234375, 0.16740798950195312, 0.1749420166015625, 0.18247604370117188, 0.19001007080078125, 0.19754409790039062, 0.205078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 21.0, 58.0, 216.0, 343.0, 243.0, 86.0, 18.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.959199905395508, -5.786752223968506, -5.614304542541504, -5.441856861114502, -5.2694091796875, -5.096961498260498, -4.924513816833496, -4.752066135406494, -4.579618453979492, -4.40717077255249, -4.234723091125488, -4.062275409698486, -3.8898277282714844, -3.7173800468444824, -3.5449323654174805, -3.3724846839904785, -3.2000370025634766, -3.0275893211364746, -2.8551416397094727, -2.6826939582824707, -2.5102462768554688, -2.337798595428467, -2.165350914001465, -1.992903232574463, -1.820455551147461, -1.648007869720459, -1.475560188293457, -1.303112506866455, -1.1306648254394531, -0.9582171440124512, -0.7857694625854492, -0.6133217811584473, -0.4408740997314453, -0.26842641830444336, -0.0959787368774414, 0.07646894454956055, 0.2489166259765625, 0.42136430740356445, 0.5938119888305664, 0.7662596702575684, 0.9387073516845703, 1.1111550331115723, 1.2836027145385742, 1.4560503959655762, 1.6284980773925781, 1.80094575881958, 1.973393440246582, 2.145841121673584, 2.318288803100586, 2.490736484527588, 2.66318416595459, 2.835631847381592, 3.0080795288085938, 3.1805272102355957, 3.3529748916625977, 3.5254225730895996, 3.6978702545166016, 3.8703179359436035, 4.0427656173706055, 4.215213298797607, 4.387660980224609, 4.560108661651611, 4.732556343078613, 4.905004024505615, 5.077451705932617]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 10.0, 15.0, 16.0, 18.0, 26.0, 30.0, 32.0, 41.0, 50.0, 47.0, 52.0, 60.0, 55.0, 83.0, 64.0, 60.0, 43.0, 50.0, 43.0, 38.0, 27.0, 31.0, 25.0, 18.0, 14.0, 8.0, 8.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4693262577056885, -3.373845100402832, -3.2783639430999756, -3.182882785797119, -3.087401866912842, -2.9919207096099854, -2.896439552307129, -2.8009583950042725, -2.705477237701416, -2.6099960803985596, -2.514514923095703, -2.4190337657928467, -2.3235526084899902, -2.228071689605713, -2.1325905323028564, -2.037109375, -1.9416282176971436, -1.846147060394287, -1.7506659030914307, -1.6551848649978638, -1.5597037076950073, -1.4642225503921509, -1.368741512298584, -1.2732603549957275, -1.177779197692871, -1.0822980403900146, -0.986816942691803, -0.8913358449935913, -0.7958546876907349, -0.7003735303878784, -0.6048924326896667, -0.5094113349914551, -0.41392993927001953, -0.3184488117694855, -0.22296768426895142, -0.12748655676841736, -0.0320054292678833, 0.06347569823265076, 0.15895682573318481, 0.2544379234313965, 0.34991908073425293, 0.445400208234787, 0.540881335735321, 0.6363624334335327, 0.7318435907363892, 0.8273247480392456, 0.9228058457374573, 1.018286943435669, 1.1137681007385254, 1.2092492580413818, 1.3047304153442383, 1.4002114534378052, 1.4956926107406616, 1.591173768043518, 1.686654806137085, 1.7821359634399414, 1.8776171207427979, 1.9730982780456543, 2.0685794353485107, 2.164060592651367, 2.2595415115356445, 2.355022668838501, 2.4505038261413574, 2.545984983444214, 2.6414661407470703]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 13.0, 4.0, 12.0, 18.0, 51.0, 85.0, 166.0, 364.0, 820.0, 2197.0, 8513.0, 73408.0, 3996158.0, 98321.0, 10029.0, 2495.0, 898.0, 381.0, 182.0, 81.0, 45.0, 16.0, 12.0, 4.0, 2.0, 2.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5611991882324219, -0.5476913452148438, -0.5341835021972656, -0.5206756591796875, -0.5071678161621094, -0.49365997314453125, -0.4801521301269531, -0.466644287109375, -0.4531364440917969, -0.43962860107421875, -0.4261207580566406, -0.4126129150390625, -0.3991050720214844, -0.38559722900390625, -0.3720893859863281, -0.35858154296875, -0.3450736999511719, -0.33156585693359375, -0.3180580139160156, -0.3045501708984375, -0.2910423278808594, -0.27753448486328125, -0.2640266418457031, -0.250518798828125, -0.23701095581054688, -0.22350311279296875, -0.20999526977539062, -0.1964874267578125, -0.18297958374023438, -0.16947174072265625, -0.15596389770507812, -0.1424560546875, -0.12894821166992188, -0.11544036865234375, -0.10193252563476562, -0.0884246826171875, -0.07491683959960938, -0.06140899658203125, -0.047901153564453125, -0.034393310546875, -0.020885467529296875, -0.00737762451171875, 0.006130218505859375, 0.0196380615234375, 0.033145904541015625, 0.04665374755859375, 0.060161590576171875, 0.07366943359375, 0.08717727661132812, 0.10068511962890625, 0.11419296264648438, 0.1277008056640625, 0.14120864868164062, 0.15471649169921875, 0.16822433471679688, 0.181732177734375, 0.19524002075195312, 0.20874786376953125, 0.22225570678710938, 0.2357635498046875, 0.24927139282226562, 0.26277923583984375, 0.2762870788574219, 0.289794921875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 9.0, 15.0, 19.0, 29.0, 37.0, 56.0, 59.0, 81.0, 78.0, 84.0, 84.0, 76.0, 68.0, 53.0, 60.0, 46.0, 42.0, 21.0, 19.0, 15.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17284584045410156, -0.16649246215820312, -0.1601390838623047, -0.15378570556640625, -0.1474323272705078, -0.14107894897460938, -0.13472557067871094, -0.1283721923828125, -0.12201881408691406, -0.11566543579101562, -0.10931205749511719, -0.10295867919921875, -0.09660530090332031, -0.09025192260742188, -0.08389854431152344, -0.077545166015625, -0.07119178771972656, -0.06483840942382812, -0.05848503112792969, -0.05213165283203125, -0.04577827453613281, -0.039424896240234375, -0.03307151794433594, -0.0267181396484375, -0.020364761352539062, -0.014011383056640625, -0.0076580047607421875, -0.00130462646484375, 0.0050487518310546875, 0.011402130126953125, 0.017755508422851562, 0.02410888671875, 0.030462265014648438, 0.036815643310546875, 0.04316902160644531, 0.04952239990234375, 0.05587577819824219, 0.062229156494140625, 0.06858253479003906, 0.0749359130859375, 0.08128929138183594, 0.08764266967773438, 0.09399604797363281, 0.10034942626953125, 0.10670280456542969, 0.11305618286132812, 0.11940956115722656, 0.125762939453125, 0.13211631774902344, 0.13846969604492188, 0.1448230743408203, 0.15117645263671875, 0.1575298309326172, 0.16388320922851562, 0.17023658752441406, 0.1765899658203125, 0.18294334411621094, 0.18929672241210938, 0.1956501007080078, 0.20200347900390625, 0.2083568572998047, 0.21471023559570312, 0.22106361389160156, 0.2274169921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 4.0, 5.0, 11.0, 15.0, 16.0, 27.0, 31.0, 28.0, 48.0, 71.0, 93.0, 146.0, 248.0, 390.0, 652.0, 1169.0, 2192.0, 4137.0, 8773.0, 22279.0, 78036.0, 680359.0, 3203491.0, 135978.0, 32822.0, 11866.0, 5235.0, 2620.0, 1419.0, 777.0, 442.0, 286.0, 167.0, 129.0, 73.0, 56.0, 50.0, 36.0, 27.0, 23.0, 16.0, 13.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14990234375, -0.14493370056152344, -0.13996505737304688, -0.1349964141845703, -0.13002777099609375, -0.1250591278076172, -0.12009048461914062, -0.11512184143066406, -0.1101531982421875, -0.10518455505371094, -0.10021591186523438, -0.09524726867675781, -0.09027862548828125, -0.08530998229980469, -0.08034133911132812, -0.07537269592285156, -0.070404052734375, -0.06543540954589844, -0.060466766357421875, -0.05549812316894531, -0.05052947998046875, -0.04556083679199219, -0.040592193603515625, -0.03562355041503906, -0.0306549072265625, -0.025686264038085938, -0.020717620849609375, -0.015748977661132812, -0.01078033447265625, -0.0058116912841796875, -0.000843048095703125, 0.0041255950927734375, 0.00909423828125, 0.014062881469726562, 0.019031524658203125, 0.024000167846679688, 0.02896881103515625, 0.03393745422363281, 0.038906097412109375, 0.04387474060058594, 0.0488433837890625, 0.05381202697753906, 0.058780670166015625, 0.06374931335449219, 0.06871795654296875, 0.07368659973144531, 0.07865524291992188, 0.08362388610839844, 0.088592529296875, 0.09356117248535156, 0.09852981567382812, 0.10349845886230469, 0.10846710205078125, 0.11343574523925781, 0.11840438842773438, 0.12337303161621094, 0.1283416748046875, 0.13331031799316406, 0.13827896118164062, 0.1432476043701172, 0.14821624755859375, 0.1531848907470703, 0.15815353393554688, 0.16312217712402344, 0.1680908203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 9.0, 24.0, 32.0, 55.0, 116.0, 322.0, 2361.0, 745.0, 186.0, 87.0, 47.0, 26.0, 15.0, 10.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08263015747070312, -0.07822418212890625, -0.07381820678710938, -0.0694122314453125, -0.06500625610351562, -0.06060028076171875, -0.056194305419921875, -0.051788330078125, -0.047382354736328125, -0.04297637939453125, -0.038570404052734375, -0.0341644287109375, -0.029758453369140625, -0.02535247802734375, -0.020946502685546875, -0.01654052734375, -0.012134552001953125, -0.00772857666015625, -0.003322601318359375, 0.0010833740234375, 0.005489349365234375, 0.00989532470703125, 0.014301300048828125, 0.018707275390625, 0.023113250732421875, 0.02751922607421875, 0.031925201416015625, 0.0363311767578125, 0.040737152099609375, 0.04514312744140625, 0.049549102783203125, 0.053955078125, 0.058361053466796875, 0.06276702880859375, 0.06717300415039062, 0.0715789794921875, 0.07598495483398438, 0.08039093017578125, 0.08479690551757812, 0.089202880859375, 0.09360885620117188, 0.09801483154296875, 0.10242080688476562, 0.1068267822265625, 0.11123275756835938, 0.11563873291015625, 0.12004470825195312, 0.12445068359375, 0.12885665893554688, 0.13326263427734375, 0.13766860961914062, 0.1420745849609375, 0.14648056030273438, 0.15088653564453125, 0.15529251098632812, 0.159698486328125, 0.16410446166992188, 0.16851043701171875, 0.17291641235351562, 0.1773223876953125, 0.18172836303710938, 0.18613433837890625, 0.19054031372070312, 0.1949462890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 18.0, 34.0, 75.0, 116.0, 200.0, 188.0, 171.0, 103.0, 56.0, 12.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9666217565536499, -0.9421549439430237, -0.9176881909370422, -0.893221378326416, -0.8687546253204346, -0.8442878127098083, -0.8198210000991821, -0.7953542470932007, -0.7708874344825745, -0.7464206218719482, -0.7219538688659668, -0.6974870562553406, -0.6730203032493591, -0.6485534906387329, -0.6240867376327515, -0.5996199250221252, -0.575153112411499, -0.5506862998008728, -0.5262195467948914, -0.5017527341842651, -0.4772859513759613, -0.45281916856765747, -0.42835238575935364, -0.4038856029510498, -0.37941884994506836, -0.3549520671367645, -0.3304852843284607, -0.3060184717178345, -0.28155168890953064, -0.2570849061012268, -0.23261812329292297, -0.20815132558345795, -0.18368452787399292, -0.1592177450656891, -0.13475094735622406, -0.11028416454792023, -0.0858173742890358, -0.06135058403015137, -0.036883801221847534, -0.012417003512382507, 0.012049779295921326, 0.036516569554805756, 0.06098335608839989, 0.08545014262199402, 0.10991693288087845, 0.13438372313976288, 0.1588505059480667, 0.18331730365753174, 0.20778408646583557, 0.2322508692741394, 0.25671765208244324, 0.28118443489074707, 0.3056512475013733, 0.3301180303096771, 0.35458481311798096, 0.3790516257286072, 0.4035183787345886, 0.42798516154289246, 0.4524519443511963, 0.4769187569618225, 0.501385509967804, 0.5258523225784302, 0.5503190755844116, 0.5747858881950378, 0.5992527008056641]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 13.0, 21.0, 15.0, 29.0, 24.0, 24.0, 28.0, 22.0, 23.0, 35.0, 55.0, 41.0, 40.0, 55.0, 64.0, 34.0, 54.0, 47.0, 55.0, 42.0, 42.0, 35.0, 30.0, 32.0, 21.0, 24.0, 15.0, 13.0, 9.0, 12.0, 5.0, 4.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.29025834798812866, -0.28041642904281616, -0.27057451009750366, -0.26073259115219116, -0.25089070200920105, -0.24104878306388855, -0.23120686411857605, -0.22136494517326355, -0.21152302622795105, -0.20168110728263855, -0.19183920323848724, -0.18199728429317474, -0.17215536534786224, -0.16231346130371094, -0.15247154235839844, -0.14262962341308594, -0.13278771936893463, -0.12294580787420273, -0.11310388892889023, -0.10326197743415833, -0.09342005848884583, -0.08357814699411392, -0.07373623549938202, -0.06389431655406952, -0.054052405059337616, -0.044210489839315414, -0.03436857461929321, -0.02452666312456131, -0.014684747904539108, -0.004842832684516907, 0.004999078810214996, 0.014840997755527496, 0.0246829092502594, 0.0345248244702816, 0.0443667396903038, 0.054208651185035706, 0.0640505701303482, 0.07389248162508011, 0.08373439311981201, 0.09357631206512451, 0.10341822355985641, 0.11326013505458832, 0.12310205399990082, 0.13294395804405212, 0.14278587698936462, 0.15262779593467712, 0.16246971487998962, 0.17231163382530212, 0.18215353786945343, 0.19199545681476593, 0.20183736085891724, 0.21167927980422974, 0.22152119874954224, 0.23136311769485474, 0.24120502173900604, 0.25104695558547974, 0.26088884472846985, 0.27073076367378235, 0.28057268261909485, 0.29041457176208496, 0.30025649070739746, 0.31009840965270996, 0.31994032859802246, 0.32978224754333496, 0.33962416648864746]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 0.0, 3.0, 8.0, 11.0, 22.0, 24.0, 51.0, 95.0, 192.0, 567.0, 2326.0, 20232.0, 485038.0, 515061.0, 21550.0, 2376.0, 581.0, 187.0, 104.0, 41.0, 30.0, 16.0, 16.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.75048828125, -0.7312507629394531, -0.7120132446289062, -0.6927757263183594, -0.6735382080078125, -0.6543006896972656, -0.6350631713867188, -0.6158256530761719, -0.596588134765625, -0.5773506164550781, -0.5581130981445312, -0.5388755798339844, -0.5196380615234375, -0.5004005432128906, -0.48116302490234375, -0.4619255065917969, -0.44268798828125, -0.4234504699707031, -0.40421295166015625, -0.3849754333496094, -0.3657379150390625, -0.3465003967285156, -0.32726287841796875, -0.3080253601074219, -0.288787841796875, -0.2695503234863281, -0.25031280517578125, -0.23107528686523438, -0.2118377685546875, -0.19260025024414062, -0.17336273193359375, -0.15412521362304688, -0.1348876953125, -0.11565017700195312, -0.09641265869140625, -0.07717514038085938, -0.0579376220703125, -0.038700103759765625, -0.01946258544921875, -0.000225067138671875, 0.019012451171875, 0.038249969482421875, 0.05748748779296875, 0.07672500610351562, 0.0959625244140625, 0.11520004272460938, 0.13443756103515625, 0.15367507934570312, 0.17291259765625, 0.19215011596679688, 0.21138763427734375, 0.23062515258789062, 0.2498626708984375, 0.2691001892089844, 0.28833770751953125, 0.3075752258300781, 0.326812744140625, 0.3460502624511719, 0.36528778076171875, 0.3845252990722656, 0.4037628173828125, 0.4230003356933594, 0.44223785400390625, 0.4614753723144531, 0.480712890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 14.0, 14.0, 19.0, 25.0, 54.0, 47.0, 52.0, 80.0, 86.0, 60.0, 84.0, 73.0, 80.0, 71.0, 50.0, 45.0, 50.0, 22.0, 18.0, 17.0, 8.0, 10.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.17122268676757812, -0.16495513916015625, -0.15868759155273438, -0.1524200439453125, -0.14615249633789062, -0.13988494873046875, -0.13361740112304688, -0.127349853515625, -0.12108230590820312, -0.11481475830078125, -0.10854721069335938, -0.1022796630859375, -0.09601211547851562, -0.08974456787109375, -0.08347702026367188, -0.07720947265625, -0.07094192504882812, -0.06467437744140625, -0.058406829833984375, -0.0521392822265625, -0.045871734619140625, -0.03960418701171875, -0.033336639404296875, -0.027069091796875, -0.020801544189453125, -0.01453399658203125, -0.008266448974609375, -0.0019989013671875, 0.004268646240234375, 0.01053619384765625, 0.016803741455078125, 0.0230712890625, 0.029338836669921875, 0.03560638427734375, 0.041873931884765625, 0.0481414794921875, 0.054409027099609375, 0.06067657470703125, 0.06694412231445312, 0.073211669921875, 0.07947921752929688, 0.08574676513671875, 0.09201431274414062, 0.0982818603515625, 0.10454940795898438, 0.11081695556640625, 0.11708450317382812, 0.12335205078125, 0.12961959838867188, 0.13588714599609375, 0.14215469360351562, 0.1484222412109375, 0.15468978881835938, 0.16095733642578125, 0.16722488403320312, 0.173492431640625, 0.17975997924804688, 0.18602752685546875, 0.19229507446289062, 0.1985626220703125, 0.20483016967773438, 0.21109771728515625, 0.21736526489257812, 0.2236328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 10.0, 8.0, 11.0, 19.0, 27.0, 32.0, 64.0, 89.0, 164.0, 281.0, 592.0, 1651.0, 7942.0, 163100.0, 834160.0, 34853.0, 3478.0, 1004.0, 425.0, 273.0, 123.0, 84.0, 42.0, 28.0, 23.0, 20.0, 14.0, 5.0, 7.0, 8.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.61328125, -0.5948562622070312, -0.5764312744140625, -0.5580062866210938, -0.539581298828125, -0.5211563110351562, -0.5027313232421875, -0.48430633544921875, -0.46588134765625, -0.44745635986328125, -0.4290313720703125, -0.41060638427734375, -0.392181396484375, -0.37375640869140625, -0.3553314208984375, -0.33690643310546875, -0.3184814453125, -0.30005645751953125, -0.2816314697265625, -0.26320648193359375, -0.244781494140625, -0.22635650634765625, -0.2079315185546875, -0.18950653076171875, -0.17108154296875, -0.15265655517578125, -0.1342315673828125, -0.11580657958984375, -0.097381591796875, -0.07895660400390625, -0.0605316162109375, -0.04210662841796875, -0.023681640625, -0.00525665283203125, 0.0131683349609375, 0.03159332275390625, 0.050018310546875, 0.06844329833984375, 0.0868682861328125, 0.10529327392578125, 0.12371826171875, 0.14214324951171875, 0.1605682373046875, 0.17899322509765625, 0.197418212890625, 0.21584320068359375, 0.2342681884765625, 0.25269317626953125, 0.2711181640625, 0.28954315185546875, 0.3079681396484375, 0.32639312744140625, 0.344818115234375, 0.36324310302734375, 0.3816680908203125, 0.40009307861328125, 0.41851806640625, 0.43694305419921875, 0.4553680419921875, 0.47379302978515625, 0.492218017578125, 0.5106430053710938, 0.5290679931640625, 0.5474929809570312, 0.56591796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 6.0, 6.0, 5.0, 11.0, 8.0, 15.0, 16.0, 24.0, 24.0, 17.0, 26.0, 23.0, 29.0, 55.0, 21.0, 53.0, 38.0, 30.0, 59.0, 43.0, 43.0, 44.0, 39.0, 48.0, 34.0, 41.0, 37.0, 24.0, 34.0, 25.0, 23.0, 13.0, 9.0, 13.0, 12.0, 1.0, 11.0, 6.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.42138671875, -0.4075660705566406, -0.39374542236328125, -0.3799247741699219, -0.3661041259765625, -0.3522834777832031, -0.33846282958984375, -0.3246421813964844, -0.310821533203125, -0.2970008850097656, -0.28318023681640625, -0.2693595886230469, -0.2555389404296875, -0.24171829223632812, -0.22789764404296875, -0.21407699584960938, -0.20025634765625, -0.18643569946289062, -0.17261505126953125, -0.15879440307617188, -0.1449737548828125, -0.13115310668945312, -0.11733245849609375, -0.10351181030273438, -0.089691162109375, -0.07587051391601562, -0.06204986572265625, -0.048229217529296875, -0.0344085693359375, -0.020587921142578125, -0.00676727294921875, 0.007053375244140625, 0.0208740234375, 0.034694671630859375, 0.04851531982421875, 0.062335968017578125, 0.0761566162109375, 0.08997726440429688, 0.10379791259765625, 0.11761856079101562, 0.131439208984375, 0.14525985717773438, 0.15908050537109375, 0.17290115356445312, 0.1867218017578125, 0.20054244995117188, 0.21436309814453125, 0.22818374633789062, 0.24200439453125, 0.2558250427246094, 0.26964569091796875, 0.2834663391113281, 0.2972869873046875, 0.3111076354980469, 0.32492828369140625, 0.3387489318847656, 0.352569580078125, 0.3663902282714844, 0.38021087646484375, 0.3940315246582031, 0.4078521728515625, 0.4216728210449219, 0.43549346923828125, 0.4493141174316406, 0.463134765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 8.0, 4.0, 5.0, 14.0, 27.0, 43.0, 63.0, 112.0, 234.0, 604.0, 1429.0, 5354.0, 36944.0, 678273.0, 300611.0, 19233.0, 3604.0, 1085.0, 453.0, 195.0, 101.0, 54.0, 39.0, 24.0, 10.0, 5.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1475830078125, -0.1420879364013672, -0.13659286499023438, -0.13109779357910156, -0.12560272216796875, -0.12010765075683594, -0.11461257934570312, -0.10911750793457031, -0.1036224365234375, -0.09812736511230469, -0.09263229370117188, -0.08713722229003906, -0.08164215087890625, -0.07614707946777344, -0.07065200805664062, -0.06515693664550781, -0.059661865234375, -0.05416679382324219, -0.048671722412109375, -0.04317665100097656, -0.03768157958984375, -0.03218650817871094, -0.026691436767578125, -0.021196365356445312, -0.0157012939453125, -0.010206222534179688, -0.004711151123046875, 0.0007839202880859375, 0.00627899169921875, 0.011774063110351562, 0.017269134521484375, 0.022764205932617188, 0.02825927734375, 0.03375434875488281, 0.039249420166015625, 0.04474449157714844, 0.05023956298828125, 0.05573463439941406, 0.061229705810546875, 0.06672477722167969, 0.0722198486328125, 0.07771492004394531, 0.08320999145507812, 0.08870506286621094, 0.09420013427734375, 0.09969520568847656, 0.10519027709960938, 0.11068534851074219, 0.116180419921875, 0.12167549133300781, 0.12717056274414062, 0.13266563415527344, 0.13816070556640625, 0.14365577697753906, 0.14915084838867188, 0.1546459197998047, 0.1601409912109375, 0.1656360626220703, 0.17113113403320312, 0.17662620544433594, 0.18212127685546875, 0.18761634826660156, 0.19311141967773438, 0.1986064910888672, 0.2041015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 4.0, 7.0, 6.0, 8.0, 6.0, 12.0, 6.0, 10.0, 12.0, 18.0, 15.0, 23.0, 22.0, 20.0, 39.0, 35.0, 46.0, 52.0, 73.0, 109.0, 100.0, 75.0, 46.0, 44.0, 34.0, 21.0, 27.0, 19.0, 16.0, 17.0, 14.0, 7.0, 9.0, 10.0, 8.0, 4.0, 4.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.561113357543945e-05, -5.4006464779376984e-05, -5.2401795983314514e-05, -5.0797127187252045e-05, -4.9192458391189575e-05, -4.7587789595127106e-05, -4.5983120799064636e-05, -4.437845200300217e-05, -4.27737832069397e-05, -4.116911441087723e-05, -3.956444561481476e-05, -3.795977681875229e-05, -3.635510802268982e-05, -3.475043922662735e-05, -3.314577043056488e-05, -3.154110163450241e-05, -2.993643283843994e-05, -2.8331764042377472e-05, -2.6727095246315002e-05, -2.5122426450252533e-05, -2.3517757654190063e-05, -2.1913088858127594e-05, -2.0308420062065125e-05, -1.8703751266002655e-05, -1.7099082469940186e-05, -1.5494413673877716e-05, -1.3889744877815247e-05, -1.2285076081752777e-05, -1.0680407285690308e-05, -9.075738489627838e-06, -7.471069693565369e-06, -5.866400897502899e-06, -4.26173210144043e-06, -2.65706330537796e-06, -1.0523945093154907e-06, 5.522742867469788e-07, 2.1569430828094482e-06, 3.7616118788719177e-06, 5.366280674934387e-06, 6.970949470996857e-06, 8.575618267059326e-06, 1.0180287063121796e-05, 1.1784955859184265e-05, 1.3389624655246735e-05, 1.4994293451309204e-05, 1.6598962247371674e-05, 1.8203631043434143e-05, 1.9808299839496613e-05, 2.1412968635559082e-05, 2.301763743162155e-05, 2.462230622768402e-05, 2.622697502374649e-05, 2.783164381980896e-05, 2.943631261587143e-05, 3.10409814119339e-05, 3.264565020799637e-05, 3.425031900405884e-05, 3.585498780012131e-05, 3.745965659618378e-05, 3.9064325392246246e-05, 4.0668994188308716e-05, 4.2273662984371185e-05, 4.3878331780433655e-05, 4.5483000576496124e-05, 4.7087669372558594e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 10.0, 21.0, 50.0, 107.0, 249.0, 898.0, 4796.0, 147481.0, 875938.0, 16598.0, 1690.0, 427.0, 176.0, 60.0, 28.0, 11.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26806640625, -0.2585716247558594, -0.24907684326171875, -0.23958206176757812, -0.2300872802734375, -0.22059249877929688, -0.21109771728515625, -0.20160293579101562, -0.192108154296875, -0.18261337280273438, -0.17311859130859375, -0.16362380981445312, -0.1541290283203125, -0.14463424682617188, -0.13513946533203125, -0.12564468383789062, -0.11614990234375, -0.10665512084960938, -0.09716033935546875, -0.08766555786132812, -0.0781707763671875, -0.06867599487304688, -0.05918121337890625, -0.049686431884765625, -0.040191650390625, -0.030696868896484375, -0.02120208740234375, -0.011707305908203125, -0.0022125244140625, 0.007282257080078125, 0.01677703857421875, 0.026271820068359375, 0.0357666015625, 0.045261383056640625, 0.05475616455078125, 0.06425094604492188, 0.0737457275390625, 0.08324050903320312, 0.09273529052734375, 0.10223007202148438, 0.111724853515625, 0.12121963500976562, 0.13071441650390625, 0.14020919799804688, 0.1497039794921875, 0.15919876098632812, 0.16869354248046875, 0.17818832397460938, 0.18768310546875, 0.19717788696289062, 0.20667266845703125, 0.21616744995117188, 0.2256622314453125, 0.23515701293945312, 0.24465179443359375, 0.2541465759277344, 0.263641357421875, 0.2731361389160156, 0.28263092041015625, 0.2921257019042969, 0.3016204833984375, 0.3111152648925781, 0.32061004638671875, 0.3301048278808594, 0.339599609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 10.0, 10.0, 7.0, 10.0, 18.0, 33.0, 31.0, 59.0, 69.0, 112.0, 122.0, 124.0, 108.0, 82.0, 68.0, 49.0, 28.0, 23.0, 13.0, 13.0, 4.0, 5.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17526817321777344, -0.16999435424804688, -0.1647205352783203, -0.15944671630859375, -0.1541728973388672, -0.14889907836914062, -0.14362525939941406, -0.1383514404296875, -0.13307762145996094, -0.12780380249023438, -0.12252998352050781, -0.11725616455078125, -0.11198234558105469, -0.10670852661132812, -0.10143470764160156, -0.096160888671875, -0.09088706970214844, -0.08561325073242188, -0.08033943176269531, -0.07506561279296875, -0.06979179382324219, -0.06451797485351562, -0.05924415588378906, -0.0539703369140625, -0.04869651794433594, -0.043422698974609375, -0.03814888000488281, -0.03287506103515625, -0.027601242065429688, -0.022327423095703125, -0.017053604125976562, -0.01177978515625, -0.0065059661865234375, -0.001232147216796875, 0.0040416717529296875, 0.00931549072265625, 0.014589309692382812, 0.019863128662109375, 0.025136947631835938, 0.0304107666015625, 0.03568458557128906, 0.040958404541015625, 0.04623222351074219, 0.05150604248046875, 0.05677986145019531, 0.062053680419921875, 0.06732749938964844, 0.072601318359375, 0.07787513732910156, 0.08314895629882812, 0.08842277526855469, 0.09369659423828125, 0.09897041320800781, 0.10424423217773438, 0.10951805114746094, 0.1147918701171875, 0.12006568908691406, 0.12533950805664062, 0.1306133270263672, 0.13588714599609375, 0.1411609649658203, 0.14643478393554688, 0.15170860290527344, 0.156982421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 17.0, 80.0, 291.0, 411.0, 176.0, 23.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.352109670639038, -1.1346243619918823, -0.9171390533447266, -0.699653685092926, -0.48216837644577026, -0.2646830081939697, -0.047197699546813965, 0.1702876091003418, 0.38777291774749756, 0.6052582263946533, 0.8227435350418091, 1.0402288436889648, 1.2577142715454102, 1.475199580192566, 1.6926848888397217, 1.9101701974868774, 2.127655506134033, 2.3451409339904785, 2.5626261234283447, 2.78011155128479, 2.9975967407226562, 3.2150821685791016, 3.432567596435547, 3.650052785873413, 3.8675379753112793, 4.085023403167725, 4.30250883102417, 4.519993782043457, 4.737479209899902, 4.954964637756348, 5.172450065612793, 5.389935493469238, 5.607420444488525, 5.824905872344971, 6.042391300201416, 6.259876251220703, 6.477361679077148, 6.694847106933594, 6.912332534790039, 7.129817962646484, 7.3473029136657715, 7.564788341522217, 7.782273769378662, 7.999758720397949, 8.217244148254395, 8.43472957611084, 8.652215003967285, 8.86970043182373, 9.087185859680176, 9.304671287536621, 9.522156715393066, 9.739642143249512, 9.957127571105957, 10.174612045288086, 10.392097473144531, 10.609582901000977, 10.827068328857422, 11.044553756713867, 11.262039184570312, 11.479524612426758, 11.697010040283203, 11.914495468139648, 12.131979942321777, 12.349465370178223, 12.566950798034668]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 9.0, 10.0, 12.0, 21.0, 14.0, 17.0, 29.0, 31.0, 34.0, 27.0, 42.0, 37.0, 44.0, 69.0, 62.0, 67.0, 53.0, 49.0, 56.0, 34.0, 38.0, 34.0, 44.0, 35.0, 23.0, 23.0, 15.0, 18.0, 11.0, 8.0, 11.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0299534797668457, -1.9568727016448975, -1.8837920427322388, -1.8107112646102905, -1.7376306056976318, -1.6645498275756836, -1.5914690494537354, -1.5183883905410767, -1.445307731628418, -1.3722269535064697, -1.299146294593811, -1.2260655164718628, -1.152984857559204, -1.0799040794372559, -1.0068233013153076, -0.9337426424026489, -0.8606618642807007, -0.7875811457633972, -0.7145004272460938, -0.6414196491241455, -0.5683389902114868, -0.49525824189186096, -0.4221774935722351, -0.34909677505493164, -0.2760160565376282, -0.2029353380203247, -0.12985460460186005, -0.056773871183395386, 0.01630684733390808, 0.08938756585121155, 0.1624683141708374, 0.23554903268814087, 0.30862975120544434, 0.3817104697227478, 0.45479118824005127, 0.5278719663619995, 0.6009526252746582, 0.6740334033966064, 0.7471141219139099, 0.8201948404312134, 0.8932755589485168, 0.9663562774658203, 1.0394370555877686, 1.1125177145004272, 1.1855984926223755, 1.2586791515350342, 1.3317599296569824, 1.4048407077789307, 1.4779213666915894, 1.5510021448135376, 1.6240828037261963, 1.6971635818481445, 1.7702442407608032, 1.8433250188827515, 1.9164056777954102, 1.9894864559173584, 2.0625672340393066, 2.135648012161255, 2.208728790283203, 2.2818093299865723, 2.3548901081085205, 2.4279708862304688, 2.501051664352417, 2.5741324424743652, 2.6472129821777344]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 10.0, 8.0, 12.0, 11.0, 20.0, 26.0, 39.0, 47.0, 88.0, 162.0, 261.0, 552.0, 1427.0, 4671.0, 29211.0, 1106717.0, 2985625.0, 55079.0, 6950.0, 1902.0, 652.0, 312.0, 174.0, 90.0, 59.0, 41.0, 31.0, 19.0, 18.0, 15.0, 6.0, 13.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.341064453125, -0.3310699462890625, -0.321075439453125, -0.3110809326171875, -0.30108642578125, -0.2910919189453125, -0.281097412109375, -0.2711029052734375, -0.2611083984375, -0.2511138916015625, -0.241119384765625, -0.2311248779296875, -0.22113037109375, -0.2111358642578125, -0.201141357421875, -0.1911468505859375, -0.18115234375, -0.1711578369140625, -0.161163330078125, -0.1511688232421875, -0.14117431640625, -0.1311798095703125, -0.121185302734375, -0.1111907958984375, -0.1011962890625, -0.0912017822265625, -0.081207275390625, -0.0712127685546875, -0.06121826171875, -0.0512237548828125, -0.041229248046875, -0.0312347412109375, -0.021240234375, -0.0112457275390625, -0.001251220703125, 0.0087432861328125, 0.01873779296875, 0.0287322998046875, 0.038726806640625, 0.0487213134765625, 0.0587158203125, 0.0687103271484375, 0.078704833984375, 0.0886993408203125, 0.09869384765625, 0.1086883544921875, 0.118682861328125, 0.1286773681640625, 0.138671875, 0.1486663818359375, 0.158660888671875, 0.1686553955078125, 0.17864990234375, 0.1886444091796875, 0.198638916015625, 0.2086334228515625, 0.2186279296875, 0.2286224365234375, 0.238616943359375, 0.2486114501953125, 0.25860595703125, 0.2686004638671875, 0.278594970703125, 0.2885894775390625, 0.298583984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 15.0, 15.0, 20.0, 37.0, 41.0, 66.0, 95.0, 86.0, 85.0, 85.0, 84.0, 84.0, 62.0, 53.0, 42.0, 40.0, 21.0, 20.0, 8.0, 12.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16370010375976562, -0.15747833251953125, -0.15125656127929688, -0.1450347900390625, -0.13881301879882812, -0.13259124755859375, -0.12636947631835938, -0.120147705078125, -0.11392593383789062, -0.10770416259765625, -0.10148239135742188, -0.0952606201171875, -0.08903884887695312, -0.08281707763671875, -0.07659530639648438, -0.07037353515625, -0.06415176391601562, -0.05792999267578125, -0.051708221435546875, -0.0454864501953125, -0.039264678955078125, -0.03304290771484375, -0.026821136474609375, -0.020599365234375, -0.014377593994140625, -0.00815582275390625, -0.001934051513671875, 0.0042877197265625, 0.010509490966796875, 0.01673126220703125, 0.022953033447265625, 0.0291748046875, 0.035396575927734375, 0.04161834716796875, 0.047840118408203125, 0.0540618896484375, 0.060283660888671875, 0.06650543212890625, 0.07272720336914062, 0.078948974609375, 0.08517074584960938, 0.09139251708984375, 0.09761428833007812, 0.1038360595703125, 0.11005783081054688, 0.11627960205078125, 0.12250137329101562, 0.12872314453125, 0.13494491577148438, 0.14116668701171875, 0.14738845825195312, 0.1536102294921875, 0.15983200073242188, 0.16605377197265625, 0.17227554321289062, 0.178497314453125, 0.18471908569335938, 0.19094085693359375, 0.19716262817382812, 0.2033843994140625, 0.20960617065429688, 0.21582794189453125, 0.22204971313476562, 0.228271484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 9.0, 9.0, 16.0, 42.0, 67.0, 130.0, 335.0, 1123.0, 5400.0, 69653.0, 3988282.0, 120320.0, 6978.0, 1252.0, 351.0, 136.0, 70.0, 30.0, 26.0, 19.0, 7.0, 3.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.408935546875, -0.3941001892089844, -0.37926483154296875, -0.3644294738769531, -0.3495941162109375, -0.3347587585449219, -0.31992340087890625, -0.3050880432128906, -0.290252685546875, -0.2754173278808594, -0.26058197021484375, -0.24574661254882812, -0.2309112548828125, -0.21607589721679688, -0.20124053955078125, -0.18640518188476562, -0.17156982421875, -0.15673446655273438, -0.14189910888671875, -0.12706375122070312, -0.1122283935546875, -0.09739303588867188, -0.08255767822265625, -0.06772232055664062, -0.052886962890625, -0.038051605224609375, -0.02321624755859375, -0.008380889892578125, 0.0064544677734375, 0.021289825439453125, 0.03612518310546875, 0.050960540771484375, 0.0657958984375, 0.08063125610351562, 0.09546661376953125, 0.11030197143554688, 0.1251373291015625, 0.13997268676757812, 0.15480804443359375, 0.16964340209960938, 0.184478759765625, 0.19931411743164062, 0.21414947509765625, 0.22898483276367188, 0.2438201904296875, 0.2586555480957031, 0.27349090576171875, 0.2883262634277344, 0.30316162109375, 0.3179969787597656, 0.33283233642578125, 0.3476676940917969, 0.3625030517578125, 0.3773384094238281, 0.39217376708984375, 0.4070091247558594, 0.421844482421875, 0.4366798400878906, 0.45151519775390625, 0.4663505554199219, 0.4811859130859375, 0.4960212707519531, 0.5108566284179688, 0.5256919860839844, 0.54052734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 9.0, 21.0, 29.0, 50.0, 85.0, 215.0, 530.0, 1074.0, 983.0, 510.0, 237.0, 133.0, 52.0, 39.0, 15.0, 18.0, 14.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.34649658203125, -0.3363037109375, -0.32611083984375, -0.31591796875, -0.30572509765625, -0.2955322265625, -0.28533935546875, -0.275146484375, -0.26495361328125, -0.2547607421875, -0.24456787109375, -0.234375, -0.22418212890625, -0.2139892578125, -0.20379638671875, -0.193603515625, -0.18341064453125, -0.1732177734375, -0.16302490234375, -0.15283203125, -0.14263916015625, -0.1324462890625, -0.12225341796875, -0.112060546875, -0.10186767578125, -0.0916748046875, -0.08148193359375, -0.0712890625, -0.06109619140625, -0.0509033203125, -0.04071044921875, -0.030517578125, -0.02032470703125, -0.0101318359375, 6.103515625e-05, 0.01025390625, 0.02044677734375, 0.0306396484375, 0.04083251953125, 0.051025390625, 0.06121826171875, 0.0714111328125, 0.08160400390625, 0.091796875, 0.10198974609375, 0.1121826171875, 0.12237548828125, 0.132568359375, 0.14276123046875, 0.1529541015625, 0.16314697265625, 0.17333984375, 0.18353271484375, 0.1937255859375, 0.20391845703125, 0.214111328125, 0.22430419921875, 0.2344970703125, 0.24468994140625, 0.2548828125, 0.26507568359375, 0.2752685546875, 0.28546142578125, 0.295654296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 9.0, 53.0, 123.0, 248.0, 275.0, 164.0, 69.0, 21.0, 17.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.164518356323242, -3.0649330615997314, -2.9653477668762207, -2.86576247215271, -2.766177177429199, -2.6665918827056885, -2.5670065879821777, -2.467421293258667, -2.3678359985351562, -2.2682507038116455, -2.1686654090881348, -2.069080114364624, -1.9694948196411133, -1.8699095249176025, -1.7703242301940918, -1.670738935470581, -1.5711535215377808, -1.47156822681427, -1.3719829320907593, -1.2723976373672485, -1.1728123426437378, -1.073227047920227, -0.9736416935920715, -0.8740563988685608, -0.77447110414505, -0.6748858094215393, -0.5753005146980286, -0.47571519017219543, -0.3761298954486847, -0.27654460072517395, -0.17695927619934082, -0.07737398147583008, 0.022211313247680664, 0.121796615421772, 0.22138191759586334, 0.3209672272205353, 0.420552521944046, 0.5201377868652344, 0.6197231411933899, 0.7193084359169006, 0.8188937306404114, 0.9184790253639221, 1.0180643796920776, 1.1176496744155884, 1.2172349691390991, 1.3168202638626099, 1.4164055585861206, 1.5159908533096313, 1.615576148033142, 1.7151614427566528, 1.8147467374801636, 1.9143320322036743, 2.0139174461364746, 2.1135027408599854, 2.213088035583496, 2.312673330307007, 2.4122586250305176, 2.5118439197540283, 2.611429214477539, 2.71101450920105, 2.8105998039245605, 2.9101850986480713, 3.009770393371582, 3.1093556880950928, 3.2089409828186035]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 11.0, 12.0, 21.0, 20.0, 16.0, 34.0, 26.0, 29.0, 35.0, 44.0, 46.0, 39.0, 38.0, 60.0, 44.0, 61.0, 50.0, 44.0, 39.0, 33.0, 46.0, 29.0, 30.0, 33.0, 18.0, 23.0, 11.0, 13.0, 19.0, 13.0, 8.0, 8.0, 6.0, 10.0, 5.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0129623413085938, -0.9760415554046631, -0.9391207098960876, -0.902199923992157, -0.8652790784835815, -0.8283582925796509, -0.7914375066757202, -0.7545167207717896, -0.7175958752632141, -0.6806750893592834, -0.643754243850708, -0.6068334579467773, -0.5699126720428467, -0.5329918265342712, -0.4960710406303406, -0.4591502249240875, -0.4222294092178345, -0.3853085935115814, -0.34838777780532837, -0.3114669919013977, -0.27454617619514465, -0.2376253604888916, -0.20070455968379974, -0.16378375887870789, -0.12686294317245483, -0.08994213491678238, -0.053021326661109924, -0.01610051840543747, 0.020820289850234985, 0.05774110555648804, 0.0946619063615799, 0.13158270716667175, 0.1685035228729248, 0.20542433857917786, 0.24234513938426971, 0.2792659401893616, 0.3161867558956146, 0.3531075716018677, 0.39002835750579834, 0.4269491732120514, 0.46386998891830444, 0.5007907748222351, 0.5377116203308105, 0.5746324062347412, 0.6115531921386719, 0.6484740376472473, 0.685394823551178, 0.7223156690597534, 0.7592364549636841, 0.7961572408676147, 0.8330780863761902, 0.8699988722801208, 0.9069197177886963, 0.943840503692627, 0.9807612895965576, 1.0176820755004883, 1.054602861404419, 1.0915236473083496, 1.1284444332122803, 1.1653653383255005, 1.2022861242294312, 1.2392069101333618, 1.2761276960372925, 1.3130484819412231, 1.3499693870544434]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 9.0, 11.0, 18.0, 19.0, 35.0, 43.0, 47.0, 85.0, 130.0, 222.0, 384.0, 589.0, 1095.0, 2034.0, 3968.0, 8315.0, 18804.0, 47345.0, 128569.0, 343049.0, 308623.0, 111536.0, 41322.0, 16861.0, 7442.0, 3724.0, 1812.0, 973.0, 539.0, 331.0, 237.0, 114.0, 93.0, 46.0, 33.0, 25.0, 19.0, 14.0, 7.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1553955078125, -0.15037155151367188, -0.14534759521484375, -0.14032363891601562, -0.1352996826171875, -0.13027572631835938, -0.12525177001953125, -0.12022781372070312, -0.115203857421875, -0.11017990112304688, -0.10515594482421875, -0.10013198852539062, -0.0951080322265625, -0.09008407592773438, -0.08506011962890625, -0.08003616333007812, -0.07501220703125, -0.06998825073242188, -0.06496429443359375, -0.059940338134765625, -0.0549163818359375, -0.049892425537109375, -0.04486846923828125, -0.039844512939453125, -0.034820556640625, -0.029796600341796875, -0.02477264404296875, -0.019748687744140625, -0.0147247314453125, -0.009700775146484375, -0.00467681884765625, 0.000347137451171875, 0.00537109375, 0.010395050048828125, 0.01541900634765625, 0.020442962646484375, 0.0254669189453125, 0.030490875244140625, 0.03551483154296875, 0.040538787841796875, 0.045562744140625, 0.050586700439453125, 0.05561065673828125, 0.060634613037109375, 0.0656585693359375, 0.07068252563476562, 0.07570648193359375, 0.08073043823242188, 0.08575439453125, 0.09077835083007812, 0.09580230712890625, 0.10082626342773438, 0.1058502197265625, 0.11087417602539062, 0.11589813232421875, 0.12092208862304688, 0.125946044921875, 0.13097000122070312, 0.13599395751953125, 0.14101791381835938, 0.1460418701171875, 0.15106582641601562, 0.15608978271484375, 0.16111373901367188, 0.1661376953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 24.0, 17.0, 31.0, 41.0, 57.0, 71.0, 99.0, 105.0, 90.0, 81.0, 74.0, 66.0, 56.0, 50.0, 39.0, 22.0, 18.0, 10.0, 14.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17268753051757812, -0.16641998291015625, -0.16015243530273438, -0.1538848876953125, -0.14761734008789062, -0.14134979248046875, -0.13508224487304688, -0.128814697265625, -0.12254714965820312, -0.11627960205078125, -0.11001205444335938, -0.1037445068359375, -0.09747695922851562, -0.09120941162109375, -0.08494186401367188, -0.07867431640625, -0.07240676879882812, -0.06613922119140625, -0.059871673583984375, -0.0536041259765625, -0.047336578369140625, -0.04106903076171875, -0.034801483154296875, -0.028533935546875, -0.022266387939453125, -0.01599884033203125, -0.009731292724609375, -0.0034637451171875, 0.002803802490234375, 0.00907135009765625, 0.015338897705078125, 0.0216064453125, 0.027873992919921875, 0.03414154052734375, 0.040409088134765625, 0.0466766357421875, 0.052944183349609375, 0.05921173095703125, 0.06547927856445312, 0.071746826171875, 0.07801437377929688, 0.08428192138671875, 0.09054946899414062, 0.0968170166015625, 0.10308456420898438, 0.10935211181640625, 0.11561965942382812, 0.12188720703125, 0.12815475463867188, 0.13442230224609375, 0.14068984985351562, 0.1469573974609375, 0.15322494506835938, 0.15949249267578125, 0.16576004028320312, 0.172027587890625, 0.17829513549804688, 0.18456268310546875, 0.19083023071289062, 0.1970977783203125, 0.20336532592773438, 0.20963287353515625, 0.21590042114257812, 0.22216796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 5.0, 6.0, 16.0, 20.0, 25.0, 37.0, 71.0, 133.0, 243.0, 416.0, 757.0, 1864.0, 7165.0, 100265.0, 867009.0, 61758.0, 5573.0, 1626.0, 689.0, 343.0, 177.0, 117.0, 84.0, 47.0, 37.0, 21.0, 8.0, 6.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394287109375, -0.3787803649902344, -0.36327362060546875, -0.3477668762207031, -0.3322601318359375, -0.3167533874511719, -0.30124664306640625, -0.2857398986816406, -0.270233154296875, -0.2547264099121094, -0.23921966552734375, -0.22371292114257812, -0.2082061767578125, -0.19269943237304688, -0.17719268798828125, -0.16168594360351562, -0.14617919921875, -0.13067245483398438, -0.11516571044921875, -0.09965896606445312, -0.0841522216796875, -0.06864547729492188, -0.05313873291015625, -0.037631988525390625, -0.022125244140625, -0.006618499755859375, 0.00888824462890625, 0.024394989013671875, 0.0399017333984375, 0.055408477783203125, 0.07091522216796875, 0.08642196655273438, 0.1019287109375, 0.11743545532226562, 0.13294219970703125, 0.14844894409179688, 0.1639556884765625, 0.17946243286132812, 0.19496917724609375, 0.21047592163085938, 0.225982666015625, 0.24148941040039062, 0.25699615478515625, 0.2725028991699219, 0.2880096435546875, 0.3035163879394531, 0.31902313232421875, 0.3345298767089844, 0.35003662109375, 0.3655433654785156, 0.38105010986328125, 0.3965568542480469, 0.4120635986328125, 0.4275703430175781, 0.44307708740234375, 0.4585838317871094, 0.474090576171875, 0.4895973205566406, 0.5051040649414062, 0.5206108093261719, 0.5361175537109375, 0.5516242980957031, 0.5671310424804688, 0.5826377868652344, 0.59814453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 3.0, 10.0, 11.0, 7.0, 8.0, 17.0, 14.0, 19.0, 25.0, 26.0, 23.0, 13.0, 36.0, 29.0, 38.0, 39.0, 44.0, 39.0, 46.0, 34.0, 42.0, 47.0, 42.0, 32.0, 38.0, 28.0, 37.0, 29.0, 32.0, 28.0, 27.0, 16.0, 30.0, 16.0, 14.0, 15.0, 14.0, 4.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.369384765625, -0.35717010498046875, -0.3449554443359375, -0.33274078369140625, -0.320526123046875, -0.30831146240234375, -0.2960968017578125, -0.28388214111328125, -0.27166748046875, -0.25945281982421875, -0.2472381591796875, -0.23502349853515625, -0.222808837890625, -0.21059417724609375, -0.1983795166015625, -0.18616485595703125, -0.1739501953125, -0.16173553466796875, -0.1495208740234375, -0.13730621337890625, -0.125091552734375, -0.11287689208984375, -0.1006622314453125, -0.08844757080078125, -0.07623291015625, -0.06401824951171875, -0.0518035888671875, -0.03958892822265625, -0.027374267578125, -0.01515960693359375, -0.0029449462890625, 0.00926971435546875, 0.021484375, 0.03369903564453125, 0.0459136962890625, 0.05812835693359375, 0.070343017578125, 0.08255767822265625, 0.0947723388671875, 0.10698699951171875, 0.11920166015625, 0.13141632080078125, 0.1436309814453125, 0.15584564208984375, 0.168060302734375, 0.18027496337890625, 0.1924896240234375, 0.20470428466796875, 0.2169189453125, 0.22913360595703125, 0.2413482666015625, 0.25356292724609375, 0.265777587890625, 0.27799224853515625, 0.2902069091796875, 0.30242156982421875, 0.31463623046875, 0.32685089111328125, 0.3390655517578125, 0.35128021240234375, 0.363494873046875, 0.37570953369140625, 0.3879241943359375, 0.40013885498046875, 0.412353515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 17.0, 19.0, 23.0, 46.0, 65.0, 117.0, 200.0, 355.0, 703.0, 1683.0, 5502.0, 27742.0, 341560.0, 622463.0, 37517.0, 6842.0, 1985.0, 768.0, 380.0, 192.0, 120.0, 61.0, 53.0, 31.0, 24.0, 16.0, 12.0, 11.0, 10.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1320629119873047, -0.12679672241210938, -0.12153053283691406, -0.11626434326171875, -0.11099815368652344, -0.10573196411132812, -0.10046577453613281, -0.0951995849609375, -0.08993339538574219, -0.08466720581054688, -0.07940101623535156, -0.07413482666015625, -0.06886863708496094, -0.06360244750976562, -0.05833625793457031, -0.053070068359375, -0.04780387878417969, -0.042537689208984375, -0.03727149963378906, -0.03200531005859375, -0.026739120483398438, -0.021472930908203125, -0.016206741333007812, -0.0109405517578125, -0.0056743621826171875, -0.000408172607421875, 0.0048580169677734375, 0.01012420654296875, 0.015390396118164062, 0.020656585693359375, 0.025922775268554688, 0.03118896484375, 0.03645515441894531, 0.041721343994140625, 0.04698753356933594, 0.05225372314453125, 0.05751991271972656, 0.06278610229492188, 0.06805229187011719, 0.0733184814453125, 0.07858467102050781, 0.08385086059570312, 0.08911705017089844, 0.09438323974609375, 0.09964942932128906, 0.10491561889648438, 0.11018180847167969, 0.115447998046875, 0.12071418762207031, 0.12598037719726562, 0.13124656677246094, 0.13651275634765625, 0.14177894592285156, 0.14704513549804688, 0.1523113250732422, 0.1575775146484375, 0.1628437042236328, 0.16810989379882812, 0.17337608337402344, 0.17864227294921875, 0.18390846252441406, 0.18917465209960938, 0.1944408416748047, 0.19970703125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 13.0, 22.0, 26.0, 24.0, 48.0, 52.0, 96.0, 133.0, 140.0, 115.0, 83.0, 45.0, 21.0, 21.0, 23.0, 15.0, 15.0, 16.0, 7.0, 8.0, 6.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56382942199707e-05, -7.321685552597046e-05, -7.079541683197021e-05, -6.837397813796997e-05, -6.595253944396973e-05, -6.353110074996948e-05, -6.110966205596924e-05, -5.8688223361968994e-05, -5.626678466796875e-05, -5.3845345973968506e-05, -5.142390727996826e-05, -4.900246858596802e-05, -4.6581029891967773e-05, -4.415959119796753e-05, -4.1738152503967285e-05, -3.931671380996704e-05, -3.68952751159668e-05, -3.447383642196655e-05, -3.205239772796631e-05, -2.9630959033966064e-05, -2.720952033996582e-05, -2.4788081645965576e-05, -2.2366642951965332e-05, -1.9945204257965088e-05, -1.7523765563964844e-05, -1.51023268699646e-05, -1.2680888175964355e-05, -1.0259449481964111e-05, -7.838010787963867e-06, -5.416572093963623e-06, -2.995133399963379e-06, -5.736947059631348e-07, 1.8477439880371094e-06, 4.2691826820373535e-06, 6.690621376037598e-06, 9.112060070037842e-06, 1.1533498764038086e-05, 1.395493745803833e-05, 1.6376376152038574e-05, 1.879781484603882e-05, 2.1219253540039062e-05, 2.3640692234039307e-05, 2.606213092803955e-05, 2.8483569622039795e-05, 3.090500831604004e-05, 3.332644701004028e-05, 3.574788570404053e-05, 3.816932439804077e-05, 4.0590763092041016e-05, 4.301220178604126e-05, 4.5433640480041504e-05, 4.785507917404175e-05, 5.027651786804199e-05, 5.2697956562042236e-05, 5.511939525604248e-05, 5.7540833950042725e-05, 5.996227264404297e-05, 6.238371133804321e-05, 6.480515003204346e-05, 6.72265887260437e-05, 6.964802742004395e-05, 7.206946611404419e-05, 7.449090480804443e-05, 7.691234350204468e-05, 7.933378219604492e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 10.0, 16.0, 9.0, 31.0, 46.0, 69.0, 124.0, 184.0, 357.0, 672.0, 1428.0, 4067.0, 17987.0, 165732.0, 783128.0, 60329.0, 9501.0, 2652.0, 1010.0, 458.0, 310.0, 160.0, 94.0, 69.0, 25.0, 32.0, 18.0, 8.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23584747314453125, -0.2299957275390625, -0.22414398193359375, -0.218292236328125, -0.21244049072265625, -0.2065887451171875, -0.20073699951171875, -0.19488525390625, -0.18903350830078125, -0.1831817626953125, -0.17733001708984375, -0.171478271484375, -0.16562652587890625, -0.1597747802734375, -0.15392303466796875, -0.1480712890625, -0.14221954345703125, -0.1363677978515625, -0.13051605224609375, -0.124664306640625, -0.11881256103515625, -0.1129608154296875, -0.10710906982421875, -0.10125732421875, -0.09540557861328125, -0.0895538330078125, -0.08370208740234375, -0.077850341796875, -0.07199859619140625, -0.0661468505859375, -0.06029510498046875, -0.054443359375, -0.04859161376953125, -0.0427398681640625, -0.03688812255859375, -0.031036376953125, -0.02518463134765625, -0.0193328857421875, -0.01348114013671875, -0.00762939453125, -0.00177764892578125, 0.0040740966796875, 0.00992584228515625, 0.015777587890625, 0.02162933349609375, 0.0274810791015625, 0.03333282470703125, 0.0391845703125, 0.04503631591796875, 0.0508880615234375, 0.05673980712890625, 0.062591552734375, 0.06844329833984375, 0.0742950439453125, 0.08014678955078125, 0.08599853515625, 0.09185028076171875, 0.0977020263671875, 0.10355377197265625, 0.109405517578125, 0.11525726318359375, 0.1211090087890625, 0.12696075439453125, 0.1328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 4.0, 7.0, 10.0, 14.0, 10.0, 24.0, 18.0, 17.0, 22.0, 38.0, 38.0, 43.0, 53.0, 44.0, 55.0, 66.0, 67.0, 60.0, 56.0, 50.0, 50.0, 40.0, 39.0, 29.0, 14.0, 21.0, 14.0, 4.0, 9.0, 6.0, 6.0, 12.0, 6.0, 5.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08203125, -0.0791788101196289, -0.07632637023925781, -0.07347393035888672, -0.07062149047851562, -0.06776905059814453, -0.06491661071777344, -0.062064170837402344, -0.05921173095703125, -0.056359291076660156, -0.05350685119628906, -0.05065441131591797, -0.047801971435546875, -0.04494953155517578, -0.04209709167480469, -0.039244651794433594, -0.0363922119140625, -0.033539772033691406, -0.030687332153320312, -0.02783489227294922, -0.024982452392578125, -0.02213001251220703, -0.019277572631835938, -0.016425132751464844, -0.01357269287109375, -0.010720252990722656, -0.007867813110351562, -0.005015373229980469, -0.002162933349609375, 0.0006895065307617188, 0.0035419464111328125, 0.006394386291503906, 0.009246826171875, 0.012099266052246094, 0.014951705932617188, 0.01780414581298828, 0.020656585693359375, 0.02350902557373047, 0.026361465454101562, 0.029213905334472656, 0.03206634521484375, 0.034918785095214844, 0.03777122497558594, 0.04062366485595703, 0.043476104736328125, 0.04632854461669922, 0.04918098449707031, 0.052033424377441406, 0.0548858642578125, 0.057738304138183594, 0.06059074401855469, 0.06344318389892578, 0.06629562377929688, 0.06914806365966797, 0.07200050354003906, 0.07485294342041016, 0.07770538330078125, 0.08055782318115234, 0.08341026306152344, 0.08626270294189453, 0.08911514282226562, 0.09196758270263672, 0.09482002258300781, 0.0976724624633789, 0.10052490234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 21.0, 95.0, 283.0, 367.0, 164.0, 44.0, 15.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109798908233643, -4.955634593963623, -4.8014702796936035, -4.647306442260742, -4.493142127990723, -4.338977813720703, -4.184813499450684, -4.030649185180664, -3.8764853477478027, -3.722321033477783, -3.5681569576263428, -3.4139926433563232, -3.259828567504883, -3.1056642532348633, -2.9514999389648438, -2.7973358631134033, -2.643171548843384, -2.4890072345733643, -2.334843158721924, -2.1806788444519043, -2.026514768600464, -1.8723504543304443, -1.7181862592697144, -1.5640220642089844, -1.4098578691482544, -1.2556936740875244, -1.1015294790267944, -0.9473652243614197, -0.7932010293006897, -0.6390368342399597, -0.48487257957458496, -0.330708384513855, -0.176544189453125, -0.022379979491233826, 0.13178423047065735, 0.2859484553337097, 0.4401126503944397, 0.5942768454551697, 0.7484411001205444, 0.9026052951812744, 1.0567694902420044, 1.2109336853027344, 1.3650978803634644, 1.5192620754241943, 1.6734263896942139, 1.8275904655456543, 1.9817547798156738, 2.1359190940856934, 2.290083169937134, 2.4442474842071533, 2.5984115600585938, 2.7525758743286133, 2.9067399501800537, 3.0609042644500732, 3.2150683403015137, 3.369232654571533, 3.5233969688415527, 3.6775612831115723, 3.8317253589630127, 3.9858896732330322, 4.140053749084473, 4.294218063354492, 4.448382377624512, 4.602546691894531, 4.756710529327393]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 9.0, 16.0, 12.0, 12.0, 10.0, 18.0, 25.0, 17.0, 31.0, 22.0, 29.0, 28.0, 25.0, 35.0, 30.0, 44.0, 53.0, 41.0, 37.0, 48.0, 46.0, 34.0, 35.0, 41.0, 32.0, 30.0, 32.0, 31.0, 22.0, 12.0, 29.0, 13.0, 15.0, 10.0, 17.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-1.4520676136016846, -1.4080214500427246, -1.3639752864837646, -1.3199291229248047, -1.2758829593658447, -1.2318367958068848, -1.1877906322479248, -1.1437444686889648, -1.0996983051300049, -1.055652141571045, -1.011605978012085, -0.967559814453125, -0.923513650894165, -0.8794674873352051, -0.8354212641716003, -0.7913751006126404, -0.7473288774490356, -0.7032827138900757, -0.6592365503311157, -0.6151903867721558, -0.5711442232131958, -0.5270980596542358, -0.4830518364906311, -0.43900567293167114, -0.3949595093727112, -0.3509133458137512, -0.30686718225479126, -0.2628209888935089, -0.21877482533454895, -0.174728661775589, -0.13068246841430664, -0.08663630485534668, -0.04259002208709717, 0.00145614892244339, 0.04550231993198395, 0.0895484983921051, 0.13359466195106506, 0.17764082551002502, 0.22168701887130737, 0.26573318243026733, 0.3097793459892273, 0.35382550954818726, 0.3978716731071472, 0.44191786646842957, 0.4859640300273895, 0.5300102233886719, 0.5740563869476318, 0.6181025505065918, 0.6621487140655518, 0.7061948776245117, 0.7502410411834717, 0.7942872047424316, 0.8383333683013916, 0.8823795318603516, 0.9264257550239563, 0.9704719185829163, 1.0145180225372314, 1.0585641860961914, 1.1026103496551514, 1.1466565132141113, 1.1907026767730713, 1.2347488403320312, 1.2787950038909912, 1.3228411674499512, 1.3668874502182007]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 6.0, 6.0, 10.0, 23.0, 21.0, 43.0, 60.0, 99.0, 138.0, 220.0, 418.0, 2251.0, 2331242.0, 1856715.0, 2007.0, 409.0, 201.0, 137.0, 90.0, 59.0, 37.0, 31.0, 21.0, 13.0, 3.0, 5.0, 2.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.080078125, -1.0508804321289062, -1.0216827392578125, -0.9924850463867188, -0.963287353515625, -0.9340896606445312, -0.9048919677734375, -0.8756942749023438, -0.84649658203125, -0.8172988891601562, -0.7881011962890625, -0.7589035034179688, -0.729705810546875, -0.7005081176757812, -0.6713104248046875, -0.6421127319335938, -0.6129150390625, -0.5837173461914062, -0.5545196533203125, -0.5253219604492188, -0.496124267578125, -0.46692657470703125, -0.4377288818359375, -0.40853118896484375, -0.37933349609375, -0.35013580322265625, -0.3209381103515625, -0.29174041748046875, -0.262542724609375, -0.23334503173828125, -0.2041473388671875, -0.17494964599609375, -0.145751953125, -0.11655426025390625, -0.0873565673828125, -0.05815887451171875, -0.028961181640625, 0.00023651123046875, 0.0294342041015625, 0.05863189697265625, 0.08782958984375, 0.11702728271484375, 0.1462249755859375, 0.17542266845703125, 0.204620361328125, 0.23381805419921875, 0.2630157470703125, 0.29221343994140625, 0.3214111328125, 0.35060882568359375, 0.3798065185546875, 0.40900421142578125, 0.438201904296875, 0.46739959716796875, 0.4965972900390625, 0.5257949829101562, 0.55499267578125, 0.5841903686523438, 0.6133880615234375, 0.6425857543945312, 0.671783447265625, 0.7009811401367188, 0.7301788330078125, 0.7593765258789062, 0.78857421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 15.0, 25.0, 36.0, 45.0, 58.0, 76.0, 100.0, 96.0, 107.0, 82.0, 79.0, 61.0, 61.0, 43.0, 27.0, 20.0, 21.0, 9.0, 12.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1645183563232422, -0.15826034545898438, -0.15200233459472656, -0.14574432373046875, -0.13948631286621094, -0.13322830200195312, -0.1269702911376953, -0.1207122802734375, -0.11445426940917969, -0.10819625854492188, -0.10193824768066406, -0.09568023681640625, -0.08942222595214844, -0.08316421508789062, -0.07690620422363281, -0.070648193359375, -0.06439018249511719, -0.058132171630859375, -0.05187416076660156, -0.04561614990234375, -0.03935813903808594, -0.033100128173828125, -0.026842117309570312, -0.0205841064453125, -0.014326095581054688, -0.008068084716796875, -0.0018100738525390625, 0.00444793701171875, 0.010705947875976562, 0.016963958740234375, 0.023221969604492188, 0.02947998046875, 0.03573799133300781, 0.041996002197265625, 0.04825401306152344, 0.05451202392578125, 0.06077003479003906, 0.06702804565429688, 0.07328605651855469, 0.0795440673828125, 0.08580207824707031, 0.09206008911132812, 0.09831809997558594, 0.10457611083984375, 0.11083412170410156, 0.11709213256835938, 0.12335014343261719, 0.129608154296875, 0.1358661651611328, 0.14212417602539062, 0.14838218688964844, 0.15464019775390625, 0.16089820861816406, 0.16715621948242188, 0.1734142303466797, 0.1796722412109375, 0.1859302520751953, 0.19218826293945312, 0.19844627380371094, 0.20470428466796875, 0.21096229553222656, 0.21722030639648438, 0.2234783172607422, 0.229736328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 21.0, 38.0, 91.0, 112.0, 263.0, 523.0, 1149.0, 2863.0, 9673.0, 58946.0, 2097616.0, 1955010.0, 54844.0, 8725.0, 2455.0, 918.0, 445.0, 245.0, 120.0, 97.0, 49.0, 29.0, 11.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.25146484375, -0.24308013916015625, -0.2346954345703125, -0.22631072998046875, -0.217926025390625, -0.20954132080078125, -0.2011566162109375, -0.19277191162109375, -0.18438720703125, -0.17600250244140625, -0.1676177978515625, -0.15923309326171875, -0.150848388671875, -0.14246368408203125, -0.1340789794921875, -0.12569427490234375, -0.1173095703125, -0.10892486572265625, -0.1005401611328125, -0.09215545654296875, -0.083770751953125, -0.07538604736328125, -0.0670013427734375, -0.05861663818359375, -0.05023193359375, -0.04184722900390625, -0.0334625244140625, -0.02507781982421875, -0.016693115234375, -0.00830841064453125, 7.62939453125e-05, 0.00846099853515625, 0.016845703125, 0.02523040771484375, 0.0336151123046875, 0.04199981689453125, 0.050384521484375, 0.05876922607421875, 0.0671539306640625, 0.07553863525390625, 0.08392333984375, 0.09230804443359375, 0.1006927490234375, 0.10907745361328125, 0.117462158203125, 0.12584686279296875, 0.1342315673828125, 0.14261627197265625, 0.1510009765625, 0.15938568115234375, 0.1677703857421875, 0.17615509033203125, 0.184539794921875, 0.19292449951171875, 0.2013092041015625, 0.20969390869140625, 0.21807861328125, 0.22646331787109375, 0.2348480224609375, 0.24323272705078125, 0.251617431640625, 0.26000213623046875, 0.2683868408203125, 0.27677154541015625, 0.28515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 8.0, 5.0, 10.0, 8.0, 13.0, 23.0, 35.0, 42.0, 73.0, 153.0, 311.0, 577.0, 907.0, 845.0, 502.0, 253.0, 134.0, 58.0, 45.0, 23.0, 15.0, 9.0, 7.0, 8.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.225830078125, -0.21850967407226562, -0.21118927001953125, -0.20386886596679688, -0.1965484619140625, -0.18922805786132812, -0.18190765380859375, -0.17458724975585938, -0.167266845703125, -0.15994644165039062, -0.15262603759765625, -0.14530563354492188, -0.1379852294921875, -0.13066482543945312, -0.12334442138671875, -0.11602401733398438, -0.10870361328125, -0.10138320922851562, -0.09406280517578125, -0.08674240112304688, -0.0794219970703125, -0.07210159301757812, -0.06478118896484375, -0.057460784912109375, -0.050140380859375, -0.042819976806640625, -0.03549957275390625, -0.028179168701171875, -0.0208587646484375, -0.013538360595703125, -0.00621795654296875, 0.001102447509765625, 0.0084228515625, 0.015743255615234375, 0.02306365966796875, 0.030384063720703125, 0.0377044677734375, 0.045024871826171875, 0.05234527587890625, 0.059665679931640625, 0.066986083984375, 0.07430648803710938, 0.08162689208984375, 0.08894729614257812, 0.0962677001953125, 0.10358810424804688, 0.11090850830078125, 0.11822891235351562, 0.12554931640625, 0.13286972045898438, 0.14019012451171875, 0.14751052856445312, 0.1548309326171875, 0.16215133666992188, 0.16947174072265625, 0.17679214477539062, 0.184112548828125, 0.19143295288085938, 0.19875335693359375, 0.20607376098632812, 0.2133941650390625, 0.22071456909179688, 0.22803497314453125, 0.23535537719726562, 0.24267578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 20.0, 36.0, 74.0, 129.0, 189.0, 200.0, 163.0, 62.0, 44.0, 30.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1887683868408203, -2.1335010528564453, -2.0782337188720703, -2.0229663848876953, -1.9676991701126099, -1.9124318361282349, -1.8571646213531494, -1.8018972873687744, -1.7466299533843994, -1.6913626194000244, -1.6360952854156494, -1.580828070640564, -1.525560736656189, -1.470293402671814, -1.4150261878967285, -1.3597588539123535, -1.3044915199279785, -1.2492241859436035, -1.1939568519592285, -1.138689637184143, -1.083422303199768, -1.028154969215393, -0.9728876948356628, -0.9176204204559326, -0.8623530864715576, -0.8070857524871826, -0.7518184781074524, -0.6965512037277222, -0.6412838697433472, -0.5860165357589722, -0.5307492613792419, -0.47548195719718933, -0.4202146530151367, -0.3649473488330841, -0.3096800446510315, -0.2544127404689789, -0.19914543628692627, -0.14387813210487366, -0.08861082792282104, -0.03334352374076843, 0.02192378044128418, 0.07719108462333679, 0.1324583888053894, 0.18772569298744202, 0.24299299716949463, 0.29826030135154724, 0.35352760553359985, 0.40879490971565247, 0.4640622138977051, 0.5193295478820801, 0.5745968222618103, 0.6298640966415405, 0.6851314306259155, 0.7403987646102905, 0.7956660389900208, 0.850933313369751, 0.906200647354126, 0.961467981338501, 1.016735315322876, 1.0720025300979614, 1.1272698640823364, 1.1825371980667114, 1.2378044128417969, 1.2930717468261719, 1.3483390808105469]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 10.0, 11.0, 17.0, 17.0, 27.0, 33.0, 31.0, 41.0, 47.0, 46.0, 63.0, 70.0, 60.0, 65.0, 53.0, 49.0, 59.0, 47.0, 43.0, 44.0, 31.0, 21.0, 20.0, 19.0, 14.0, 17.0, 7.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9478108882904053, -0.9135656356811523, -0.8793204426765442, -0.8450751900672913, -0.8108299970626831, -0.7765847444534302, -0.7423394918441772, -0.7080942392349243, -0.6738490462303162, -0.6396037936210632, -0.6053586006164551, -0.5711133480072021, -0.5368680953979492, -0.5026229023933411, -0.46837764978408813, -0.4341324269771576, -0.39988720417022705, -0.3656419813632965, -0.33139675855636597, -0.29715150594711304, -0.2629062831401825, -0.22866106033325195, -0.19441582262516022, -0.16017058491706848, -0.12592536211013794, -0.0916801318526268, -0.05743490159511566, -0.023189671337604523, 0.011055558919906616, 0.04530078172683716, 0.0795460194349289, 0.11379125714302063, 0.14803647994995117, 0.1822817027568817, 0.21652694046497345, 0.2507721781730652, 0.2850174009799957, 0.31926262378692627, 0.3535078763961792, 0.38775309920310974, 0.4219983220100403, 0.4562435448169708, 0.49048876762390137, 0.5247340202331543, 0.5589792728424072, 0.5932244658470154, 0.6274697184562683, 0.6617149114608765, 0.6959601640701294, 0.7302054166793823, 0.7644506096839905, 0.7986958622932434, 0.8329410552978516, 0.8671863079071045, 0.9014315605163574, 0.9356768131256104, 0.9699220061302185, 1.0041671991348267, 1.0384124517440796, 1.0726577043533325, 1.1069029569625854, 1.1411480903625488, 1.1753933429718018, 1.2096385955810547, 1.2438838481903076]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 7.0, 8.0, 11.0, 24.0, 21.0, 49.0, 80.0, 94.0, 151.0, 234.0, 419.0, 657.0, 1094.0, 2025.0, 4075.0, 8324.0, 18741.0, 45834.0, 130911.0, 380079.0, 296129.0, 95531.0, 35093.0, 14913.0, 6721.0, 3214.0, 1692.0, 914.0, 521.0, 380.0, 228.0, 127.0, 94.0, 48.0, 49.0, 20.0, 18.0, 4.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146240234375, -0.1411724090576172, -0.13610458374023438, -0.13103675842285156, -0.12596893310546875, -0.12090110778808594, -0.11583328247070312, -0.11076545715332031, -0.1056976318359375, -0.10062980651855469, -0.09556198120117188, -0.09049415588378906, -0.08542633056640625, -0.08035850524902344, -0.07529067993164062, -0.07022285461425781, -0.065155029296875, -0.06008720397949219, -0.055019378662109375, -0.04995155334472656, -0.04488372802734375, -0.03981590270996094, -0.034748077392578125, -0.029680252075195312, -0.0246124267578125, -0.019544601440429688, -0.014476776123046875, -0.009408950805664062, -0.00434112548828125, 0.0007266998291015625, 0.005794525146484375, 0.010862350463867188, 0.01593017578125, 0.020998001098632812, 0.026065826416015625, 0.031133651733398438, 0.03620147705078125, 0.04126930236816406, 0.046337127685546875, 0.05140495300292969, 0.0564727783203125, 0.06154060363769531, 0.06660842895507812, 0.07167625427246094, 0.07674407958984375, 0.08181190490722656, 0.08687973022460938, 0.09194755554199219, 0.097015380859375, 0.10208320617675781, 0.10715103149414062, 0.11221885681152344, 0.11728668212890625, 0.12235450744628906, 0.12742233276367188, 0.1324901580810547, 0.1375579833984375, 0.1426258087158203, 0.14769363403320312, 0.15276145935058594, 0.15782928466796875, 0.16289710998535156, 0.16796493530273438, 0.1730327606201172, 0.1781005859375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 13.0, 17.0, 22.0, 41.0, 43.0, 49.0, 85.0, 71.0, 89.0, 89.0, 97.0, 81.0, 63.0, 46.0, 49.0, 33.0, 28.0, 20.0, 11.0, 10.0, 15.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1656494140625, -0.15985107421875, -0.154052734375, -0.14825439453125, -0.1424560546875, -0.13665771484375, -0.130859375, -0.12506103515625, -0.1192626953125, -0.11346435546875, -0.107666015625, -0.10186767578125, -0.0960693359375, -0.09027099609375, -0.08447265625, -0.07867431640625, -0.0728759765625, -0.06707763671875, -0.061279296875, -0.05548095703125, -0.0496826171875, -0.04388427734375, -0.0380859375, -0.03228759765625, -0.0264892578125, -0.02069091796875, -0.014892578125, -0.00909423828125, -0.0032958984375, 0.00250244140625, 0.00830078125, 0.01409912109375, 0.0198974609375, 0.02569580078125, 0.031494140625, 0.03729248046875, 0.0430908203125, 0.04888916015625, 0.0546875, 0.06048583984375, 0.0662841796875, 0.07208251953125, 0.077880859375, 0.08367919921875, 0.0894775390625, 0.09527587890625, 0.10107421875, 0.10687255859375, 0.1126708984375, 0.11846923828125, 0.124267578125, 0.13006591796875, 0.1358642578125, 0.14166259765625, 0.1474609375, 0.15325927734375, 0.1590576171875, 0.16485595703125, 0.170654296875, 0.17645263671875, 0.1822509765625, 0.18804931640625, 0.19384765625, 0.19964599609375, 0.2054443359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 17.0, 19.0, 27.0, 35.0, 86.0, 170.0, 401.0, 1090.0, 4746.0, 56402.0, 891410.0, 85843.0, 6160.0, 1302.0, 439.0, 165.0, 100.0, 51.0, 19.0, 22.0, 14.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.46915435791015625, -0.4514923095703125, -0.43383026123046875, -0.416168212890625, -0.39850616455078125, -0.3808441162109375, -0.36318206787109375, -0.34552001953125, -0.32785797119140625, -0.3101959228515625, -0.29253387451171875, -0.274871826171875, -0.25720977783203125, -0.2395477294921875, -0.22188568115234375, -0.2042236328125, -0.18656158447265625, -0.1688995361328125, -0.15123748779296875, -0.133575439453125, -0.11591339111328125, -0.0982513427734375, -0.08058929443359375, -0.06292724609375, -0.04526519775390625, -0.0276031494140625, -0.00994110107421875, 0.007720947265625, 0.02538299560546875, 0.0430450439453125, 0.06070709228515625, 0.078369140625, 0.09603118896484375, 0.1136932373046875, 0.13135528564453125, 0.149017333984375, 0.16667938232421875, 0.1843414306640625, 0.20200347900390625, 0.21966552734375, 0.23732757568359375, 0.2549896240234375, 0.27265167236328125, 0.290313720703125, 0.30797576904296875, 0.3256378173828125, 0.34329986572265625, 0.3609619140625, 0.37862396240234375, 0.3962860107421875, 0.41394805908203125, 0.431610107421875, 0.44927215576171875, 0.4669342041015625, 0.48459625244140625, 0.50225830078125, 0.5199203491210938, 0.5375823974609375, 0.5552444458007812, 0.572906494140625, 0.5905685424804688, 0.6082305908203125, 0.6258926391601562, 0.6435546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 13.0, 15.0, 21.0, 20.0, 23.0, 27.0, 43.0, 51.0, 47.0, 54.0, 50.0, 76.0, 58.0, 66.0, 63.0, 47.0, 49.0, 54.0, 38.0, 35.0, 23.0, 18.0, 26.0, 17.0, 10.0, 6.0, 10.0, 14.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5442581176757812, -0.5279693603515625, -0.5116806030273438, -0.495391845703125, -0.47910308837890625, -0.4628143310546875, -0.44652557373046875, -0.43023681640625, -0.41394805908203125, -0.3976593017578125, -0.38137054443359375, -0.365081787109375, -0.34879302978515625, -0.3325042724609375, -0.31621551513671875, -0.2999267578125, -0.28363800048828125, -0.2673492431640625, -0.25106048583984375, -0.234771728515625, -0.21848297119140625, -0.2021942138671875, -0.18590545654296875, -0.16961669921875, -0.15332794189453125, -0.1370391845703125, -0.12075042724609375, -0.104461669921875, -0.08817291259765625, -0.0718841552734375, -0.05559539794921875, -0.039306640625, -0.02301788330078125, -0.0067291259765625, 0.00955963134765625, 0.025848388671875, 0.04213714599609375, 0.0584259033203125, 0.07471466064453125, 0.09100341796875, 0.10729217529296875, 0.1235809326171875, 0.13986968994140625, 0.156158447265625, 0.17244720458984375, 0.1887359619140625, 0.20502471923828125, 0.2213134765625, 0.23760223388671875, 0.2538909912109375, 0.27017974853515625, 0.286468505859375, 0.30275726318359375, 0.3190460205078125, 0.33533477783203125, 0.35162353515625, 0.36791229248046875, 0.3842010498046875, 0.40048980712890625, 0.416778564453125, 0.43306732177734375, 0.4493560791015625, 0.46564483642578125, 0.48193359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 6.0, 26.0, 14.0, 38.0, 77.0, 136.0, 319.0, 1024.0, 4496.0, 49387.0, 893579.0, 90898.0, 6528.0, 1226.0, 389.0, 187.0, 87.0, 43.0, 25.0, 15.0, 11.0, 12.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.286376953125, -0.2783317565917969, -0.27028656005859375, -0.2622413635253906, -0.2541961669921875, -0.24615097045898438, -0.23810577392578125, -0.23006057739257812, -0.222015380859375, -0.21397018432617188, -0.20592498779296875, -0.19787979125976562, -0.1898345947265625, -0.18178939819335938, -0.17374420166015625, -0.16569900512695312, -0.15765380859375, -0.14960861206054688, -0.14156341552734375, -0.13351821899414062, -0.1254730224609375, -0.11742782592773438, -0.10938262939453125, -0.10133743286132812, -0.093292236328125, -0.08524703979492188, -0.07720184326171875, -0.06915664672851562, -0.0611114501953125, -0.053066253662109375, -0.04502105712890625, -0.036975860595703125, -0.0289306640625, -0.020885467529296875, -0.01284027099609375, -0.004795074462890625, 0.0032501220703125, 0.011295318603515625, 0.01934051513671875, 0.027385711669921875, 0.035430908203125, 0.043476104736328125, 0.05152130126953125, 0.059566497802734375, 0.0676116943359375, 0.07565689086914062, 0.08370208740234375, 0.09174728393554688, 0.09979248046875, 0.10783767700195312, 0.11588287353515625, 0.12392807006835938, 0.1319732666015625, 0.14001846313476562, 0.14806365966796875, 0.15610885620117188, 0.164154052734375, 0.17219924926757812, 0.18024444580078125, 0.18828964233398438, 0.1963348388671875, 0.20438003540039062, 0.21242523193359375, 0.22047042846679688, 0.228515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 8.0, 15.0, 15.0, 26.0, 19.0, 43.0, 58.0, 92.0, 142.0, 148.0, 123.0, 94.0, 62.0, 47.0, 28.0, 18.0, 12.0, 11.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.316205978393555e-05, -9.061768651008606e-05, -8.807331323623657e-05, -8.552893996238708e-05, -8.29845666885376e-05, -8.044019341468811e-05, -7.789582014083862e-05, -7.535144686698914e-05, -7.280707359313965e-05, -7.026270031929016e-05, -6.771832704544067e-05, -6.517395377159119e-05, -6.26295804977417e-05, -6.008520722389221e-05, -5.7540833950042725e-05, -5.499646067619324e-05, -5.245208740234375e-05, -4.990771412849426e-05, -4.7363340854644775e-05, -4.481896758079529e-05, -4.22745943069458e-05, -3.9730221033096313e-05, -3.7185847759246826e-05, -3.464147448539734e-05, -3.209710121154785e-05, -2.9552727937698364e-05, -2.7008354663848877e-05, -2.446398138999939e-05, -2.1919608116149902e-05, -1.9375234842300415e-05, -1.6830861568450928e-05, -1.428648829460144e-05, -1.1742115020751953e-05, -9.197741746902466e-06, -6.6533684730529785e-06, -4.108995199203491e-06, -1.564621925354004e-06, 9.797513484954834e-07, 3.5241246223449707e-06, 6.068497896194458e-06, 8.612871170043945e-06, 1.1157244443893433e-05, 1.370161771774292e-05, 1.6245990991592407e-05, 1.8790364265441895e-05, 2.1334737539291382e-05, 2.387911081314087e-05, 2.6423484086990356e-05, 2.8967857360839844e-05, 3.151223063468933e-05, 3.405660390853882e-05, 3.6600977182388306e-05, 3.914535045623779e-05, 4.168972373008728e-05, 4.423409700393677e-05, 4.6778470277786255e-05, 4.932284355163574e-05, 5.186721682548523e-05, 5.441159009933472e-05, 5.6955963373184204e-05, 5.950033664703369e-05, 6.204470992088318e-05, 6.458908319473267e-05, 6.713345646858215e-05, 6.967782974243164e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 18.0, 26.0, 38.0, 47.0, 88.0, 159.0, 306.0, 563.0, 1382.0, 3990.0, 17310.0, 166090.0, 782866.0, 61911.0, 9281.0, 2499.0, 967.0, 443.0, 235.0, 109.0, 78.0, 54.0, 25.0, 21.0, 8.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17217636108398438, -0.16649627685546875, -0.16081619262695312, -0.1551361083984375, -0.14945602416992188, -0.14377593994140625, -0.13809585571289062, -0.132415771484375, -0.12673568725585938, -0.12105560302734375, -0.11537551879882812, -0.1096954345703125, -0.10401535034179688, -0.09833526611328125, -0.09265518188476562, -0.08697509765625, -0.08129501342773438, -0.07561492919921875, -0.06993484497070312, -0.0642547607421875, -0.058574676513671875, -0.05289459228515625, -0.047214508056640625, -0.041534423828125, -0.035854339599609375, -0.03017425537109375, -0.024494171142578125, -0.0188140869140625, -0.013134002685546875, -0.00745391845703125, -0.001773834228515625, 0.00390625, 0.009586334228515625, 0.01526641845703125, 0.020946502685546875, 0.0266265869140625, 0.032306671142578125, 0.03798675537109375, 0.043666839599609375, 0.049346923828125, 0.055027008056640625, 0.06070709228515625, 0.06638717651367188, 0.0720672607421875, 0.07774734497070312, 0.08342742919921875, 0.08910751342773438, 0.09478759765625, 0.10046768188476562, 0.10614776611328125, 0.11182785034179688, 0.1175079345703125, 0.12318801879882812, 0.12886810302734375, 0.13454818725585938, 0.140228271484375, 0.14590835571289062, 0.15158843994140625, 0.15726852416992188, 0.1629486083984375, 0.16862869262695312, 0.17430877685546875, 0.17998886108398438, 0.1856689453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 3.0, 4.0, 5.0, 9.0, 12.0, 20.0, 13.0, 13.0, 33.0, 41.0, 67.0, 84.0, 92.0, 127.0, 111.0, 94.0, 79.0, 53.0, 39.0, 23.0, 23.0, 18.0, 9.0, 10.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.143310546875, -0.13866043090820312, -0.13401031494140625, -0.12936019897460938, -0.1247100830078125, -0.12005996704101562, -0.11540985107421875, -0.11075973510742188, -0.106109619140625, -0.10145950317382812, -0.09680938720703125, -0.09215927124023438, -0.0875091552734375, -0.08285903930664062, -0.07820892333984375, -0.07355880737304688, -0.06890869140625, -0.06425857543945312, -0.05960845947265625, -0.054958343505859375, -0.0503082275390625, -0.045658111572265625, -0.04100799560546875, -0.036357879638671875, -0.031707763671875, -0.027057647705078125, -0.02240753173828125, -0.017757415771484375, -0.0131072998046875, -0.008457183837890625, -0.00380706787109375, 0.000843048095703125, 0.0054931640625, 0.010143280029296875, 0.01479339599609375, 0.019443511962890625, 0.0240936279296875, 0.028743743896484375, 0.03339385986328125, 0.038043975830078125, 0.042694091796875, 0.047344207763671875, 0.05199432373046875, 0.056644439697265625, 0.0612945556640625, 0.06594467163085938, 0.07059478759765625, 0.07524490356445312, 0.07989501953125, 0.08454513549804688, 0.08919525146484375, 0.09384536743164062, 0.0984954833984375, 0.10314559936523438, 0.10779571533203125, 0.11244583129882812, 0.117095947265625, 0.12174606323242188, 0.12639617919921875, 0.13104629516601562, 0.1356964111328125, 0.14034652709960938, 0.14499664306640625, 0.14964675903320312, 0.154296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 20.0, 66.0, 173.0, 365.0, 238.0, 78.0, 32.0, 10.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0597400665283203, -2.9184553623199463, -2.7771706581115723, -2.6358859539031982, -2.494601249694824, -2.35331654548645, -2.212031841278076, -2.070747137069702, -1.9294624328613281, -1.788177728652954, -1.64689302444458, -1.505608320236206, -1.364323616027832, -1.223038911819458, -1.081754207611084, -0.94046950340271, -0.7991847991943359, -0.6579000949859619, -0.5166153907775879, -0.37533068656921387, -0.23404598236083984, -0.09276127815246582, 0.0485234260559082, 0.18980813026428223, 0.33109283447265625, 0.4723775386810303, 0.6136622428894043, 0.7549469470977783, 0.8962316513061523, 1.0375163555145264, 1.1788010597229004, 1.3200857639312744, 1.4613704681396484, 1.6026551723480225, 1.7439398765563965, 1.8852245807647705, 2.0265092849731445, 2.1677939891815186, 2.3090786933898926, 2.4503633975982666, 2.5916481018066406, 2.7329328060150146, 2.8742175102233887, 3.0155022144317627, 3.1567869186401367, 3.2980716228485107, 3.4393563270568848, 3.580641031265259, 3.721925735473633, 3.863210439682007, 4.004495143890381, 4.145779609680176, 4.287064552307129, 4.428349494934082, 4.569633960723877, 4.710918426513672, 4.852203369140625, 4.993488311767578, 5.134772777557373, 5.276057243347168, 5.417342185974121, 5.558627128601074, 5.699911594390869, 5.841196060180664, 5.982481002807617]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 10.0, 7.0, 12.0, 13.0, 15.0, 10.0, 13.0, 23.0, 31.0, 32.0, 49.0, 43.0, 36.0, 52.0, 70.0, 81.0, 61.0, 67.0, 60.0, 34.0, 54.0, 38.0, 32.0, 31.0, 24.0, 15.0, 21.0, 18.0, 15.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4749722480773926, -2.408628225326538, -2.3422842025756836, -2.275940179824829, -2.2095961570739746, -2.14325213432312, -2.0769081115722656, -2.0105643272399902, -1.9442201852798462, -1.8778761625289917, -1.8115321397781372, -1.7451881170272827, -1.6788442134857178, -1.6125001907348633, -1.5461561679840088, -1.4798121452331543, -1.4134681224822998, -1.3471240997314453, -1.2807800769805908, -1.2144360542297363, -1.1480920314788818, -1.0817480087280273, -1.0154041051864624, -0.9490600824356079, -0.8827160596847534, -0.8163720369338989, -0.7500280141830444, -0.6836840510368347, -0.6173400282859802, -0.5509960055351257, -0.48465201258659363, -0.4183080196380615, -0.35196399688720703, -0.28561997413635254, -0.21927598118782043, -0.15293197333812714, -0.08658796548843384, -0.020243942737579346, 0.04610005021095276, 0.11244404315948486, 0.17878806591033936, 0.24513207376003265, 0.31147608160972595, 0.37782007455825806, 0.44416409730911255, 0.510508120059967, 0.5768520832061768, 0.6431961059570312, 0.7095401287078857, 0.7758841514587402, 0.8422281742095947, 0.9085721373558044, 0.9749161601066589, 1.0412602424621582, 1.1076041460037231, 1.1739481687545776, 1.2402921915054321, 1.3066362142562866, 1.3729802370071411, 1.4393242597579956, 1.5056681632995605, 1.572012186050415, 1.6383562088012695, 1.704700231552124, 1.7710442543029785]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 9.0, 15.0, 33.0, 39.0, 79.0, 140.0, 288.0, 571.0, 1343.0, 3751.0, 13661.0, 91097.0, 1614275.0, 2305185.0, 139064.0, 17357.0, 4404.0, 1515.0, 686.0, 314.0, 170.0, 104.0, 81.0, 26.0, 23.0, 20.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.164459228515625, -0.15838623046875, -0.152313232421875, -0.146240234375, -0.140167236328125, -0.13409423828125, -0.128021240234375, -0.1219482421875, -0.115875244140625, -0.10980224609375, -0.103729248046875, -0.09765625, -0.091583251953125, -0.08551025390625, -0.079437255859375, -0.0733642578125, -0.067291259765625, -0.06121826171875, -0.055145263671875, -0.049072265625, -0.042999267578125, -0.03692626953125, -0.030853271484375, -0.0247802734375, -0.018707275390625, -0.01263427734375, -0.006561279296875, -0.00048828125, 0.005584716796875, 0.01165771484375, 0.017730712890625, 0.0238037109375, 0.029876708984375, 0.03594970703125, 0.042022705078125, 0.048095703125, 0.054168701171875, 0.06024169921875, 0.066314697265625, 0.0723876953125, 0.078460693359375, 0.08453369140625, 0.090606689453125, 0.0966796875, 0.102752685546875, 0.10882568359375, 0.114898681640625, 0.1209716796875, 0.127044677734375, 0.13311767578125, 0.139190673828125, 0.145263671875, 0.151336669921875, 0.15740966796875, 0.163482666015625, 0.1695556640625, 0.175628662109375, 0.18170166015625, 0.187774658203125, 0.19384765625, 0.199920654296875, 0.20599365234375, 0.212066650390625, 0.2181396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 13.0, 14.0, 10.0, 13.0, 35.0, 44.0, 58.0, 65.0, 84.0, 111.0, 106.0, 78.0, 79.0, 76.0, 52.0, 44.0, 39.0, 23.0, 17.0, 11.0, 8.0, 10.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165771484375, -0.1597614288330078, -0.15375137329101562, -0.14774131774902344, -0.14173126220703125, -0.13572120666503906, -0.12971115112304688, -0.12370109558105469, -0.1176910400390625, -0.11168098449707031, -0.10567092895507812, -0.09966087341308594, -0.09365081787109375, -0.08764076232910156, -0.08163070678710938, -0.07562065124511719, -0.069610595703125, -0.06360054016113281, -0.057590484619140625, -0.05158042907714844, -0.04557037353515625, -0.03956031799316406, -0.033550262451171875, -0.027540206909179688, -0.0215301513671875, -0.015520095825195312, -0.009510040283203125, -0.0034999847412109375, 0.00251007080078125, 0.008520126342773438, 0.014530181884765625, 0.020540237426757812, 0.02655029296875, 0.03256034851074219, 0.038570404052734375, 0.04458045959472656, 0.05059051513671875, 0.05660057067871094, 0.06261062622070312, 0.06862068176269531, 0.0746307373046875, 0.08064079284667969, 0.08665084838867188, 0.09266090393066406, 0.09867095947265625, 0.10468101501464844, 0.11069107055664062, 0.11670112609863281, 0.122711181640625, 0.1287212371826172, 0.13473129272460938, 0.14074134826660156, 0.14675140380859375, 0.15276145935058594, 0.15877151489257812, 0.1647815704345703, 0.1707916259765625, 0.1768016815185547, 0.18281173706054688, 0.18882179260253906, 0.19483184814453125, 0.20084190368652344, 0.20685195922851562, 0.2128620147705078, 0.2188720703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 12.0, 9.0, 19.0, 30.0, 32.0, 68.0, 153.0, 334.0, 772.0, 2129.0, 8854.0, 89400.0, 3726889.0, 341366.0, 18270.0, 3967.0, 1127.0, 443.0, 194.0, 89.0, 57.0, 21.0, 14.0, 8.0, 8.0, 8.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3416595458984375, -0.329315185546875, -0.3169708251953125, -0.30462646484375, -0.2922821044921875, -0.279937744140625, -0.2675933837890625, -0.2552490234375, -0.2429046630859375, -0.230560302734375, -0.2182159423828125, -0.20587158203125, -0.1935272216796875, -0.181182861328125, -0.1688385009765625, -0.156494140625, -0.1441497802734375, -0.131805419921875, -0.1194610595703125, -0.10711669921875, -0.0947723388671875, -0.082427978515625, -0.0700836181640625, -0.0577392578125, -0.0453948974609375, -0.033050537109375, -0.0207061767578125, -0.00836181640625, 0.0039825439453125, 0.016326904296875, 0.0286712646484375, 0.041015625, 0.0533599853515625, 0.065704345703125, 0.0780487060546875, 0.09039306640625, 0.1027374267578125, 0.115081787109375, 0.1274261474609375, 0.1397705078125, 0.1521148681640625, 0.164459228515625, 0.1768035888671875, 0.18914794921875, 0.2014923095703125, 0.213836669921875, 0.2261810302734375, 0.238525390625, 0.2508697509765625, 0.263214111328125, 0.2755584716796875, 0.28790283203125, 0.3002471923828125, 0.312591552734375, 0.3249359130859375, 0.3372802734375, 0.3496246337890625, 0.361968994140625, 0.3743133544921875, 0.38665771484375, 0.3990020751953125, 0.411346435546875, 0.4236907958984375, 0.43603515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 10.0, 9.0, 10.0, 14.0, 16.0, 33.0, 41.0, 69.0, 119.0, 279.0, 484.0, 935.0, 894.0, 569.0, 246.0, 134.0, 73.0, 35.0, 28.0, 17.0, 11.0, 9.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30322265625, -0.29309844970703125, -0.2829742431640625, -0.27285003662109375, -0.262725830078125, -0.25260162353515625, -0.2424774169921875, -0.23235321044921875, -0.22222900390625, -0.21210479736328125, -0.2019805908203125, -0.19185638427734375, -0.181732177734375, -0.17160797119140625, -0.1614837646484375, -0.15135955810546875, -0.1412353515625, -0.13111114501953125, -0.1209869384765625, -0.11086273193359375, -0.100738525390625, -0.09061431884765625, -0.0804901123046875, -0.07036590576171875, -0.06024169921875, -0.05011749267578125, -0.0399932861328125, -0.02986907958984375, -0.019744873046875, -0.00962066650390625, 0.0005035400390625, 0.01062774658203125, 0.020751953125, 0.03087615966796875, 0.0410003662109375, 0.05112457275390625, 0.061248779296875, 0.07137298583984375, 0.0814971923828125, 0.09162139892578125, 0.10174560546875, 0.11186981201171875, 0.1219940185546875, 0.13211822509765625, 0.142242431640625, 0.15236663818359375, 0.1624908447265625, 0.17261505126953125, 0.1827392578125, 0.19286346435546875, 0.2029876708984375, 0.21311187744140625, 0.223236083984375, 0.23336029052734375, 0.2434844970703125, 0.25360870361328125, 0.26373291015625, 0.27385711669921875, 0.2839813232421875, 0.29410552978515625, 0.304229736328125, 0.31435394287109375, 0.3244781494140625, 0.33460235595703125, 0.3447265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 15.0, 68.0, 267.0, 390.0, 156.0, 53.0, 12.0, 11.0, 9.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.670238494873047, -5.513584136962891, -5.356929302215576, -5.200274467468262, -5.0436201095581055, -4.886965751647949, -4.730310916900635, -4.57365608215332, -4.417001724243164, -4.260347366333008, -4.103692531585693, -3.947037935256958, -3.7903833389282227, -3.6337287425994873, -3.477074146270752, -3.3204195499420166, -3.1637649536132812, -3.007110357284546, -2.8504557609558105, -2.693801164627075, -2.53714656829834, -2.3804919719696045, -2.223837375640869, -2.067182779312134, -1.9105281829833984, -1.753873586654663, -1.5972189903259277, -1.4405643939971924, -1.283909797668457, -1.1272552013397217, -0.9706006050109863, -0.813946008682251, -0.6572914123535156, -0.5006368160247803, -0.3439822196960449, -0.18732762336730957, -0.03067302703857422, 0.12598156929016113, 0.2826361656188965, 0.43929076194763184, 0.5959453582763672, 0.7525999546051025, 0.9092545509338379, 1.0659091472625732, 1.2225637435913086, 1.379218339920044, 1.5358729362487793, 1.6925275325775146, 1.84918212890625, 2.0058367252349854, 2.1624913215637207, 2.319145917892456, 2.4758005142211914, 2.6324551105499268, 2.789109706878662, 2.9457643032073975, 3.102418899536133, 3.259073495864868, 3.4157280921936035, 3.572382688522339, 3.729037284851074, 3.8856918811798096, 4.042346477508545, 4.199001312255859, 4.355655670166016]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 15.0, 11.0, 23.0, 26.0, 27.0, 67.0, 65.0, 69.0, 96.0, 81.0, 94.0, 97.0, 72.0, 62.0, 64.0, 44.0, 26.0, 18.0, 16.0, 13.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1853229999542236, -2.1063454151153564, -2.0273680686950684, -1.9483904838562012, -1.8694130182266235, -1.790435552597046, -1.7114579677581787, -1.632480502128601, -1.5535030364990234, -1.4745255708694458, -1.3955481052398682, -1.316570520401001, -1.2375930547714233, -1.1586155891418457, -1.0796380043029785, -1.0006605386734009, -0.9216830730438232, -0.8427056074142456, -0.7637280821800232, -0.6847505569458008, -0.6057730913162231, -0.5267956256866455, -0.4478181004524231, -0.3688405752182007, -0.28986310958862305, -0.21088561415672302, -0.131908118724823, -0.052930623292922974, 0.02604687213897705, 0.10502436757087708, 0.1840018630027771, 0.2629793882369995, 0.34195709228515625, 0.4209345877170563, 0.4999120831489563, 0.5788896083831787, 0.6578670740127563, 0.736844539642334, 0.8158220648765564, 0.8947995901107788, 0.9737770557403564, 1.052754521369934, 1.1317319869995117, 1.210709571838379, 1.2896870374679565, 1.3686645030975342, 1.4476420879364014, 1.526619553565979, 1.6055970191955566, 1.6845744848251343, 1.763551950454712, 1.842529535293579, 1.9215070009231567, 2.0004844665527344, 2.0794620513916016, 2.1584396362304688, 2.237416982650757, 2.316394567489624, 2.395371913909912, 2.4743494987487793, 2.5533270835876465, 2.6323044300079346, 2.7112820148468018, 2.79025936126709, 2.869236946105957]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 4.0, 13.0, 20.0, 25.0, 37.0, 77.0, 150.0, 200.0, 363.0, 712.0, 1498.0, 3439.0, 8996.0, 26759.0, 90799.0, 322095.0, 411186.0, 126633.0, 35767.0, 11699.0, 4352.0, 1832.0, 891.0, 438.0, 250.0, 123.0, 67.0, 42.0, 28.0, 14.0, 8.0, 12.0, 7.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2337646484375, -0.2271099090576172, -0.22045516967773438, -0.21380043029785156, -0.20714569091796875, -0.20049095153808594, -0.19383621215820312, -0.1871814727783203, -0.1805267333984375, -0.1738719940185547, -0.16721725463867188, -0.16056251525878906, -0.15390777587890625, -0.14725303649902344, -0.14059829711914062, -0.1339435577392578, -0.127288818359375, -0.12063407897949219, -0.11397933959960938, -0.10732460021972656, -0.10066986083984375, -0.09401512145996094, -0.08736038208007812, -0.08070564270019531, -0.0740509033203125, -0.06739616394042969, -0.060741424560546875, -0.05408668518066406, -0.04743194580078125, -0.04077720642089844, -0.034122467041015625, -0.027467727661132812, -0.02081298828125, -0.014158248901367188, -0.007503509521484375, -0.0008487701416015625, 0.00580596923828125, 0.012460708618164062, 0.019115447998046875, 0.025770187377929688, 0.0324249267578125, 0.03907966613769531, 0.045734405517578125, 0.05238914489746094, 0.05904388427734375, 0.06569862365722656, 0.07235336303710938, 0.07900810241699219, 0.085662841796875, 0.09231758117675781, 0.09897232055664062, 0.10562705993652344, 0.11228179931640625, 0.11893653869628906, 0.12559127807617188, 0.1322460174560547, 0.1389007568359375, 0.1455554962158203, 0.15221023559570312, 0.15886497497558594, 0.16551971435546875, 0.17217445373535156, 0.17882919311523438, 0.1854839324951172, 0.192138671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 19.0, 13.0, 29.0, 46.0, 57.0, 59.0, 80.0, 100.0, 75.0, 102.0, 75.0, 90.0, 54.0, 50.0, 48.0, 18.0, 20.0, 13.0, 7.0, 12.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.14399337768554688, -0.13796234130859375, -0.13193130493164062, -0.1259002685546875, -0.11986923217773438, -0.11383819580078125, -0.10780715942382812, -0.101776123046875, -0.09574508666992188, -0.08971405029296875, -0.08368301391601562, -0.0776519775390625, -0.07162094116210938, -0.06558990478515625, -0.059558868408203125, -0.05352783203125, -0.047496795654296875, -0.04146575927734375, -0.035434722900390625, -0.0294036865234375, -0.023372650146484375, -0.01734161376953125, -0.011310577392578125, -0.005279541015625, 0.000751495361328125, 0.00678253173828125, 0.012813568115234375, 0.0188446044921875, 0.024875640869140625, 0.03090667724609375, 0.036937713623046875, 0.04296875, 0.048999786376953125, 0.05503082275390625, 0.061061859130859375, 0.0670928955078125, 0.07312393188476562, 0.07915496826171875, 0.08518600463867188, 0.091217041015625, 0.09724807739257812, 0.10327911376953125, 0.10931015014648438, 0.1153411865234375, 0.12137222290039062, 0.12740325927734375, 0.13343429565429688, 0.13946533203125, 0.14549636840820312, 0.15152740478515625, 0.15755844116210938, 0.1635894775390625, 0.16962051391601562, 0.17565155029296875, 0.18168258666992188, 0.187713623046875, 0.19374465942382812, 0.19977569580078125, 0.20580673217773438, 0.2118377685546875, 0.21786880493164062, 0.22389984130859375, 0.22993087768554688, 0.2359619140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 21.0, 20.0, 27.0, 41.0, 60.0, 96.0, 146.0, 230.0, 434.0, 872.0, 1733.0, 4858.0, 25587.0, 603412.0, 382197.0, 20992.0, 4319.0, 1682.0, 764.0, 420.0, 227.0, 146.0, 89.0, 52.0, 42.0, 22.0, 14.0, 11.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.57861328125, -0.5620613098144531, -0.5455093383789062, -0.5289573669433594, -0.5124053955078125, -0.4958534240722656, -0.47930145263671875, -0.4627494812011719, -0.446197509765625, -0.4296455383300781, -0.41309356689453125, -0.3965415954589844, -0.3799896240234375, -0.3634376525878906, -0.34688568115234375, -0.3303337097167969, -0.31378173828125, -0.2972297668457031, -0.28067779541015625, -0.2641258239746094, -0.2475738525390625, -0.23102188110351562, -0.21446990966796875, -0.19791793823242188, -0.181365966796875, -0.16481399536132812, -0.14826202392578125, -0.13171005249023438, -0.1151580810546875, -0.09860610961914062, -0.08205413818359375, -0.06550216674804688, -0.0489501953125, -0.032398223876953125, -0.01584625244140625, 0.000705718994140625, 0.0172576904296875, 0.033809661865234375, 0.05036163330078125, 0.06691360473632812, 0.083465576171875, 0.10001754760742188, 0.11656951904296875, 0.13312149047851562, 0.1496734619140625, 0.16622543334960938, 0.18277740478515625, 0.19932937622070312, 0.21588134765625, 0.23243331909179688, 0.24898529052734375, 0.2655372619628906, 0.2820892333984375, 0.2986412048339844, 0.31519317626953125, 0.3317451477050781, 0.348297119140625, 0.3648490905761719, 0.38140106201171875, 0.3979530334472656, 0.4145050048828125, 0.4310569763183594, 0.44760894775390625, 0.4641609191894531, 0.480712890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 8.0, 9.0, 6.0, 15.0, 10.0, 24.0, 18.0, 23.0, 33.0, 34.0, 40.0, 31.0, 41.0, 65.0, 60.0, 41.0, 66.0, 58.0, 59.0, 46.0, 51.0, 38.0, 41.0, 29.0, 41.0, 11.0, 24.0, 13.0, 12.0, 8.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.62744140625, -0.6097564697265625, -0.592071533203125, -0.5743865966796875, -0.55670166015625, -0.5390167236328125, -0.521331787109375, -0.5036468505859375, -0.4859619140625, -0.4682769775390625, -0.450592041015625, -0.4329071044921875, -0.41522216796875, -0.3975372314453125, -0.379852294921875, -0.3621673583984375, -0.344482421875, -0.3267974853515625, -0.309112548828125, -0.2914276123046875, -0.27374267578125, -0.2560577392578125, -0.238372802734375, -0.2206878662109375, -0.2030029296875, -0.1853179931640625, -0.167633056640625, -0.1499481201171875, -0.13226318359375, -0.1145782470703125, -0.096893310546875, -0.0792083740234375, -0.0615234375, -0.0438385009765625, -0.026153564453125, -0.0084686279296875, 0.00921630859375, 0.0269012451171875, 0.044586181640625, 0.0622711181640625, 0.0799560546875, 0.0976409912109375, 0.115325927734375, 0.1330108642578125, 0.15069580078125, 0.1683807373046875, 0.186065673828125, 0.2037506103515625, 0.221435546875, 0.2391204833984375, 0.256805419921875, 0.2744903564453125, 0.29217529296875, 0.3098602294921875, 0.327545166015625, 0.3452301025390625, 0.3629150390625, 0.3805999755859375, 0.398284912109375, 0.4159698486328125, 0.43365478515625, 0.4513397216796875, 0.469024658203125, 0.4867095947265625, 0.50439453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 10.0, 23.0, 53.0, 115.0, 411.0, 2031.0, 35247.0, 982066.0, 26264.0, 1755.0, 362.0, 125.0, 37.0, 23.0, 4.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.544158935546875, -0.52923583984375, -0.514312744140625, -0.4993896484375, -0.484466552734375, -0.46954345703125, -0.454620361328125, -0.439697265625, -0.424774169921875, -0.40985107421875, -0.394927978515625, -0.3800048828125, -0.365081787109375, -0.35015869140625, -0.335235595703125, -0.3203125, -0.305389404296875, -0.29046630859375, -0.275543212890625, -0.2606201171875, -0.245697021484375, -0.23077392578125, -0.215850830078125, -0.200927734375, -0.186004638671875, -0.17108154296875, -0.156158447265625, -0.1412353515625, -0.126312255859375, -0.11138916015625, -0.096466064453125, -0.08154296875, -0.066619873046875, -0.05169677734375, -0.036773681640625, -0.0218505859375, -0.006927490234375, 0.00799560546875, 0.022918701171875, 0.037841796875, 0.052764892578125, 0.06768798828125, 0.082611083984375, 0.0975341796875, 0.112457275390625, 0.12738037109375, 0.142303466796875, 0.1572265625, 0.172149658203125, 0.18707275390625, 0.201995849609375, 0.2169189453125, 0.231842041015625, 0.24676513671875, 0.261688232421875, 0.276611328125, 0.291534423828125, 0.30645751953125, 0.321380615234375, 0.3363037109375, 0.351226806640625, 0.36614990234375, 0.381072998046875, 0.39599609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 9.0, 9.0, 7.0, 9.0, 17.0, 15.0, 25.0, 24.0, 18.0, 30.0, 49.0, 37.0, 71.0, 69.0, 110.0, 99.0, 83.0, 61.0, 48.0, 33.0, 19.0, 25.0, 22.0, 19.0, 12.0, 9.0, 10.0, 4.0, 8.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35981559753418e-05, -6.16004690527916e-05, -5.9602782130241394e-05, -5.760509520769119e-05, -5.560740828514099e-05, -5.360972136259079e-05, -5.161203444004059e-05, -4.961434751749039e-05, -4.7616660594940186e-05, -4.5618973672389984e-05, -4.362128674983978e-05, -4.162359982728958e-05, -3.962591290473938e-05, -3.762822598218918e-05, -3.563053905963898e-05, -3.3632852137088776e-05, -3.1635165214538574e-05, -2.9637478291988373e-05, -2.763979136943817e-05, -2.564210444688797e-05, -2.364441752433777e-05, -2.1646730601787567e-05, -1.9649043679237366e-05, -1.7651356756687164e-05, -1.5653669834136963e-05, -1.3655982911586761e-05, -1.165829598903656e-05, -9.660609066486359e-06, -7.662922143936157e-06, -5.665235221385956e-06, -3.6675482988357544e-06, -1.669861376285553e-06, 3.2782554626464844e-07, 2.32551246881485e-06, 4.323199391365051e-06, 6.320886313915253e-06, 8.318573236465454e-06, 1.0316260159015656e-05, 1.2313947081565857e-05, 1.4311634004116058e-05, 1.630932092666626e-05, 1.830700784921646e-05, 2.0304694771766663e-05, 2.2302381694316864e-05, 2.4300068616867065e-05, 2.6297755539417267e-05, 2.8295442461967468e-05, 3.029312938451767e-05, 3.229081630706787e-05, 3.428850322961807e-05, 3.6286190152168274e-05, 3.8283877074718475e-05, 4.028156399726868e-05, 4.227925091981888e-05, 4.427693784236908e-05, 4.627462476491928e-05, 4.827231168746948e-05, 5.0269998610019684e-05, 5.2267685532569885e-05, 5.426537245512009e-05, 5.626305937767029e-05, 5.826074630022049e-05, 6.025843322277069e-05, 6.225612014532089e-05, 6.42538070678711e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 7.0, 5.0, 12.0, 26.0, 20.0, 27.0, 30.0, 50.0, 77.0, 76.0, 121.0, 165.0, 213.0, 350.0, 529.0, 848.0, 1483.0, 2891.0, 6320.0, 16259.0, 57081.0, 338537.0, 525284.0, 65938.0, 18141.0, 6780.0, 3144.0, 1516.0, 895.0, 496.0, 318.0, 263.0, 196.0, 123.0, 98.0, 66.0, 34.0, 19.0, 25.0, 16.0, 13.0, 14.0, 8.0, 10.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1385498046875, -0.13435745239257812, -0.13016510009765625, -0.12597274780273438, -0.1217803955078125, -0.11758804321289062, -0.11339569091796875, -0.10920333862304688, -0.105010986328125, -0.10081863403320312, -0.09662628173828125, -0.09243392944335938, -0.0882415771484375, -0.08404922485351562, -0.07985687255859375, -0.07566452026367188, -0.07147216796875, -0.06727981567382812, -0.06308746337890625, -0.058895111083984375, -0.0547027587890625, -0.050510406494140625, -0.04631805419921875, -0.042125701904296875, -0.037933349609375, -0.033740997314453125, -0.02954864501953125, -0.025356292724609375, -0.0211639404296875, -0.016971588134765625, -0.01277923583984375, -0.008586883544921875, -0.00439453125, -0.000202178955078125, 0.00399017333984375, 0.008182525634765625, 0.0123748779296875, 0.016567230224609375, 0.02075958251953125, 0.024951934814453125, 0.029144287109375, 0.033336639404296875, 0.03752899169921875, 0.041721343994140625, 0.0459136962890625, 0.050106048583984375, 0.05429840087890625, 0.058490753173828125, 0.06268310546875, 0.06687545776367188, 0.07106781005859375, 0.07526016235351562, 0.0794525146484375, 0.08364486694335938, 0.08783721923828125, 0.09202957153320312, 0.096221923828125, 0.10041427612304688, 0.10460662841796875, 0.10879898071289062, 0.1129913330078125, 0.11718368530273438, 0.12137603759765625, 0.12556838989257812, 0.1297607421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 9.0, 18.0, 18.0, 21.0, 23.0, 28.0, 43.0, 70.0, 66.0, 88.0, 74.0, 93.0, 105.0, 89.0, 48.0, 35.0, 36.0, 24.0, 21.0, 21.0, 9.0, 10.0, 9.0, 5.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.16423606872558594, -0.15940475463867188, -0.1545734405517578, -0.14974212646484375, -0.1449108123779297, -0.14007949829101562, -0.13524818420410156, -0.1304168701171875, -0.12558555603027344, -0.12075424194335938, -0.11592292785644531, -0.11109161376953125, -0.10626029968261719, -0.10142898559570312, -0.09659767150878906, -0.091766357421875, -0.08693504333496094, -0.08210372924804688, -0.07727241516113281, -0.07244110107421875, -0.06760978698730469, -0.06277847290039062, -0.05794715881347656, -0.0531158447265625, -0.04828453063964844, -0.043453216552734375, -0.03862190246582031, -0.03379058837890625, -0.028959274291992188, -0.024127960205078125, -0.019296646118164062, -0.01446533203125, -0.009634017944335938, -0.004802703857421875, 2.86102294921875e-05, 0.00485992431640625, 0.009691238403320312, 0.014522552490234375, 0.019353866577148438, 0.0241851806640625, 0.029016494750976562, 0.033847808837890625, 0.03867912292480469, 0.04351043701171875, 0.04834175109863281, 0.053173065185546875, 0.05800437927246094, 0.062835693359375, 0.06766700744628906, 0.07249832153320312, 0.07732963562011719, 0.08216094970703125, 0.08699226379394531, 0.09182357788085938, 0.09665489196777344, 0.1014862060546875, 0.10631752014160156, 0.11114883422851562, 0.11598014831542969, 0.12081146240234375, 0.1256427764892578, 0.13047409057617188, 0.13530540466308594, 0.14013671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 9.0, 6.0, 16.0, 74.0, 228.0, 483.0, 134.0, 36.0, 13.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.729398727416992, -4.525608062744141, -4.321817398071289, -4.1180267333984375, -3.914236068725586, -3.7104454040527344, -3.506654739379883, -3.3028640747070312, -3.0990734100341797, -2.895282745361328, -2.6914920806884766, -2.487701416015625, -2.2839107513427734, -2.080120086669922, -1.8763294219970703, -1.6725387573242188, -1.4687480926513672, -1.2649574279785156, -1.061166763305664, -0.8573760986328125, -0.6535854339599609, -0.4497947692871094, -0.2460041046142578, -0.04221343994140625, 0.1615772247314453, 0.3653678894042969, 0.5691585540771484, 0.77294921875, 0.9767398834228516, 1.1805305480957031, 1.3843212127685547, 1.5881118774414062, 1.7919025421142578, 1.9956932067871094, 2.199483871459961, 2.4032745361328125, 2.607065200805664, 2.8108558654785156, 3.014646530151367, 3.2184371948242188, 3.4222278594970703, 3.626018524169922, 3.8298091888427734, 4.033599853515625, 4.237390518188477, 4.441181182861328, 4.64497184753418, 4.848762512207031, 5.052553176879883, 5.256343841552734, 5.460134506225586, 5.6639251708984375, 5.867715835571289, 6.071506500244141, 6.275297164916992, 6.479087829589844, 6.682878494262695, 6.886669158935547, 7.090459823608398, 7.29425048828125, 7.498041152954102, 7.701831817626953, 7.905622482299805, 8.109413146972656, 8.313203811645508]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 2.0, 7.0, 7.0, 10.0, 9.0, 11.0, 9.0, 23.0, 22.0, 27.0, 41.0, 28.0, 24.0, 40.0, 37.0, 25.0, 37.0, 56.0, 57.0, 54.0, 50.0, 57.0, 63.0, 38.0, 31.0, 33.0, 21.0, 21.0, 21.0, 20.0, 19.0, 16.0, 16.0, 10.0, 13.0, 7.0, 8.0, 5.0, 3.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6205451488494873, -1.5670948028564453, -1.5136444568634033, -1.4601942300796509, -1.4067438840866089, -1.353293538093567, -1.2998433113098145, -1.2463929653167725, -1.1929426193237305, -1.1394922733306885, -1.0860419273376465, -1.032591700553894, -0.979141354560852, -0.9256910085678101, -0.8722407221794128, -0.8187904357910156, -0.7653400897979736, -0.7118897438049316, -0.6584394574165344, -0.6049891710281372, -0.5515388250350952, -0.4980885088443756, -0.444638192653656, -0.3911878764629364, -0.3377375602722168, -0.2842872440814972, -0.2308369278907776, -0.17738661170005798, -0.12393629550933838, -0.07048597931861877, -0.01703566312789917, 0.036414653062820435, 0.08986496925354004, 0.14331528544425964, 0.19676560163497925, 0.25021591782569885, 0.30366623401641846, 0.35711655020713806, 0.41056686639785767, 0.46401718258857727, 0.5174674987792969, 0.5709178447723389, 0.6243681311607361, 0.6778184175491333, 0.7312687635421753, 0.7847191095352173, 0.8381693959236145, 0.8916196823120117, 0.9450700283050537, 0.9985203742980957, 1.0519707202911377, 1.1054209470748901, 1.1588712930679321, 1.2123216390609741, 1.2657718658447266, 1.3192222118377686, 1.3726725578308105, 1.4261229038238525, 1.4795732498168945, 1.533023476600647, 1.586473822593689, 1.639924168586731, 1.6933743953704834, 1.7468247413635254, 1.8002750873565674]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 16.0, 19.0, 21.0, 38.0, 83.0, 98.0, 169.0, 315.0, 680.0, 1328.0, 3329.0, 10317.0, 49729.0, 605302.0, 3132854.0, 344786.0, 32764.0, 7463.0, 2626.0, 1121.0, 567.0, 254.0, 139.0, 87.0, 60.0, 36.0, 21.0, 12.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.14270591735839844, -0.13660812377929688, -0.1305103302001953, -0.12441253662109375, -0.11831474304199219, -0.11221694946289062, -0.10611915588378906, -0.1000213623046875, -0.09392356872558594, -0.08782577514648438, -0.08172798156738281, -0.07563018798828125, -0.06953239440917969, -0.06343460083007812, -0.05733680725097656, -0.051239013671875, -0.04514122009277344, -0.039043426513671875, -0.03294563293457031, -0.02684783935546875, -0.020750045776367188, -0.014652252197265625, -0.008554458618164062, -0.0024566650390625, 0.0036411285400390625, 0.009738922119140625, 0.015836715698242188, 0.02193450927734375, 0.028032302856445312, 0.034130096435546875, 0.04022789001464844, 0.04632568359375, 0.05242347717285156, 0.058521270751953125, 0.06461906433105469, 0.07071685791015625, 0.07681465148925781, 0.08291244506835938, 0.08901023864746094, 0.0951080322265625, 0.10120582580566406, 0.10730361938476562, 0.11340141296386719, 0.11949920654296875, 0.1255970001220703, 0.13169479370117188, 0.13779258728027344, 0.143890380859375, 0.14998817443847656, 0.15608596801757812, 0.1621837615966797, 0.16828155517578125, 0.1743793487548828, 0.18047714233398438, 0.18657493591308594, 0.1926727294921875, 0.19877052307128906, 0.20486831665039062, 0.2109661102294922, 0.21706390380859375, 0.2231616973876953, 0.22925949096679688, 0.23535728454589844, 0.241455078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 4.0, 12.0, 15.0, 25.0, 41.0, 52.0, 49.0, 69.0, 76.0, 72.0, 78.0, 69.0, 89.0, 77.0, 75.0, 47.0, 33.0, 21.0, 31.0, 16.0, 12.0, 5.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.14977645874023438, -0.14403533935546875, -0.13829421997070312, -0.1325531005859375, -0.12681198120117188, -0.12107086181640625, -0.11532974243164062, -0.109588623046875, -0.10384750366210938, -0.09810638427734375, -0.09236526489257812, -0.0866241455078125, -0.08088302612304688, -0.07514190673828125, -0.06940078735351562, -0.06365966796875, -0.057918548583984375, -0.05217742919921875, -0.046436309814453125, -0.0406951904296875, -0.034954071044921875, -0.02921295166015625, -0.023471832275390625, -0.017730712890625, -0.011989593505859375, -0.00624847412109375, -0.000507354736328125, 0.0052337646484375, 0.010974884033203125, 0.01671600341796875, 0.022457122802734375, 0.0281982421875, 0.033939361572265625, 0.03968048095703125, 0.045421600341796875, 0.0511627197265625, 0.056903839111328125, 0.06264495849609375, 0.06838607788085938, 0.074127197265625, 0.07986831665039062, 0.08560943603515625, 0.09135055541992188, 0.0970916748046875, 0.10283279418945312, 0.10857391357421875, 0.11431503295898438, 0.12005615234375, 0.12579727172851562, 0.13153839111328125, 0.13727951049804688, 0.1430206298828125, 0.14876174926757812, 0.15450286865234375, 0.16024398803710938, 0.165985107421875, 0.17172622680664062, 0.17746734619140625, 0.18320846557617188, 0.1889495849609375, 0.19469070434570312, 0.20043182373046875, 0.20617294311523438, 0.2119140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 5.0, 5.0, 12.0, 5.0, 15.0, 25.0, 49.0, 71.0, 97.0, 160.0, 321.0, 589.0, 1034.0, 2155.0, 5270.0, 15900.0, 75454.0, 1097958.0, 2790783.0, 164776.0, 26761.0, 7352.0, 2671.0, 1198.0, 675.0, 359.0, 195.0, 130.0, 83.0, 54.0, 42.0, 33.0, 15.0, 11.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.1797504425048828, -0.17261123657226562, -0.16547203063964844, -0.15833282470703125, -0.15119361877441406, -0.14405441284179688, -0.1369152069091797, -0.1297760009765625, -0.12263679504394531, -0.11549758911132812, -0.10835838317871094, -0.10121917724609375, -0.09407997131347656, -0.08694076538085938, -0.07980155944824219, -0.072662353515625, -0.06552314758300781, -0.058383941650390625, -0.05124473571777344, -0.04410552978515625, -0.03696632385253906, -0.029827117919921875, -0.022687911987304688, -0.0155487060546875, -0.008409500122070312, -0.001270294189453125, 0.0058689117431640625, 0.01300811767578125, 0.020147323608398438, 0.027286529541015625, 0.03442573547363281, 0.04156494140625, 0.04870414733886719, 0.055843353271484375, 0.06298255920410156, 0.07012176513671875, 0.07726097106933594, 0.08440017700195312, 0.09153938293457031, 0.0986785888671875, 0.10581779479980469, 0.11295700073242188, 0.12009620666503906, 0.12723541259765625, 0.13437461853027344, 0.14151382446289062, 0.1486530303955078, 0.155792236328125, 0.1629314422607422, 0.17007064819335938, 0.17720985412597656, 0.18434906005859375, 0.19148826599121094, 0.19862747192382812, 0.2057666778564453, 0.2129058837890625, 0.2200450897216797, 0.22718429565429688, 0.23432350158691406, 0.24146270751953125, 0.24860191345214844, 0.2557411193847656, 0.2628803253173828, 0.27001953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 19.0, 22.0, 39.0, 73.0, 125.0, 253.0, 461.0, 843.0, 900.0, 574.0, 334.0, 146.0, 84.0, 48.0, 39.0, 19.0, 20.0, 13.0, 12.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.3205986022949219, -0.31063079833984375, -0.3006629943847656, -0.2906951904296875, -0.2807273864746094, -0.27075958251953125, -0.2607917785644531, -0.250823974609375, -0.24085617065429688, -0.23088836669921875, -0.22092056274414062, -0.2109527587890625, -0.20098495483398438, -0.19101715087890625, -0.18104934692382812, -0.17108154296875, -0.16111373901367188, -0.15114593505859375, -0.14117813110351562, -0.1312103271484375, -0.12124252319335938, -0.11127471923828125, -0.10130691528320312, -0.091339111328125, -0.08137130737304688, -0.07140350341796875, -0.061435699462890625, -0.0514678955078125, -0.041500091552734375, -0.03153228759765625, -0.021564483642578125, -0.0115966796875, -0.001628875732421875, 0.00833892822265625, 0.018306732177734375, 0.0282745361328125, 0.038242340087890625, 0.04821014404296875, 0.058177947998046875, 0.068145751953125, 0.07811355590820312, 0.08808135986328125, 0.09804916381835938, 0.1080169677734375, 0.11798477172851562, 0.12795257568359375, 0.13792037963867188, 0.14788818359375, 0.15785598754882812, 0.16782379150390625, 0.17779159545898438, 0.1877593994140625, 0.19772720336914062, 0.20769500732421875, 0.21766281127929688, 0.227630615234375, 0.23759841918945312, 0.24756622314453125, 0.2575340270996094, 0.2675018310546875, 0.2774696350097656, 0.28743743896484375, 0.2974052429199219, 0.307373046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 13.0, 51.0, 124.0, 255.0, 275.0, 159.0, 52.0, 34.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.749657392501831, -3.6328115463256836, -3.5159659385681152, -3.3991200923919678, -3.2822744846343994, -3.165428638458252, -3.0485830307006836, -2.931737184524536, -2.8148913383483887, -2.698045492172241, -2.581199884414673, -2.4643540382385254, -2.347508430480957, -2.2306625843048096, -2.113816738128662, -1.9969711303710938, -1.8801255226135254, -1.7632797956466675, -1.6464340686798096, -1.529588222503662, -1.4127426147460938, -1.2958967685699463, -1.1790510416030884, -1.0622053146362305, -0.9453595876693726, -0.8285138607025146, -0.7116681337356567, -0.594822347164154, -0.47797662019729614, -0.36113089323043823, -0.24428510665893555, -0.12743937969207764, -0.010593414306640625, 0.10625232756137848, 0.22309806942939758, 0.3399438261985779, 0.4567895531654358, 0.5736352801322937, 0.6904810667037964, 0.8073267936706543, 0.9241725206375122, 1.0410182476043701, 1.157863974571228, 1.274709701538086, 1.3915555477142334, 1.5084011554718018, 1.6252470016479492, 1.7420927286148071, 1.858938455581665, 1.975784182548523, 2.092629909515381, 2.2094757556915283, 2.3263213634490967, 2.443167209625244, 2.5600128173828125, 2.67685866355896, 2.7937045097351074, 2.910550355911255, 3.0273959636688232, 3.1442418098449707, 3.261087417602539, 3.3779332637786865, 3.494779109954834, 3.6116247177124023, 3.7284703254699707]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 8.0, 13.0, 15.0, 23.0, 25.0, 24.0, 23.0, 28.0, 43.0, 46.0, 46.0, 54.0, 53.0, 68.0, 58.0, 58.0, 70.0, 56.0, 50.0, 48.0, 43.0, 23.0, 30.0, 20.0, 13.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3352372646331787, -1.292466402053833, -1.2496955394744873, -1.2069246768951416, -1.1641539335250854, -1.1213830709457397, -1.078612208366394, -1.0358413457870483, -0.9930705428123474, -0.9502996802330017, -0.9075288772583008, -0.8647580146789551, -0.8219871520996094, -0.7792163491249084, -0.7364454865455627, -0.6936746835708618, -0.6509038209915161, -0.6081329584121704, -0.5653621554374695, -0.5225912928581238, -0.47982046008110046, -0.43704962730407715, -0.39427876472473145, -0.35150793194770813, -0.3087370991706848, -0.2659662663936615, -0.223195418715477, -0.18042457103729248, -0.13765373826026917, -0.09488290548324585, -0.052112042903900146, -0.009341210126876831, 0.033429503440856934, 0.07620034366846085, 0.11897118389606476, 0.16174203157424927, 0.20451286435127258, 0.2472836971282959, 0.2900545597076416, 0.3328253924846649, 0.37559622526168823, 0.41836705803871155, 0.46113789081573486, 0.5039087533950806, 0.5466796159744263, 0.5894504189491272, 0.6322212815284729, 0.6749920845031738, 0.7177629470825195, 0.7605338096618652, 0.8033046126365662, 0.8460754752159119, 0.8888462781906128, 0.9316171407699585, 0.9743880033493042, 1.01715886592865, 1.059929609298706, 1.1027004718780518, 1.1454713344573975, 1.1882421970367432, 1.2310129404067993, 1.273783802986145, 1.3165546655654907, 1.3593255281448364, 1.4020963907241821]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 9.0, 8.0, 16.0, 22.0, 15.0, 34.0, 47.0, 105.0, 174.0, 289.0, 562.0, 1118.0, 2405.0, 5979.0, 18251.0, 72091.0, 334520.0, 465959.0, 107239.0, 25963.0, 7782.0, 3024.0, 1387.0, 658.0, 390.0, 215.0, 106.0, 54.0, 35.0, 22.0, 16.0, 16.0, 20.0, 4.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26375770568847656, -0.2560310363769531, -0.2483043670654297, -0.24057769775390625, -0.2328510284423828, -0.22512435913085938, -0.21739768981933594, -0.2096710205078125, -0.20194435119628906, -0.19421768188476562, -0.1864910125732422, -0.17876434326171875, -0.1710376739501953, -0.16331100463867188, -0.15558433532714844, -0.147857666015625, -0.14013099670410156, -0.13240432739257812, -0.12467765808105469, -0.11695098876953125, -0.10922431945800781, -0.10149765014648438, -0.09377098083496094, -0.0860443115234375, -0.07831764221191406, -0.07059097290039062, -0.06286430358886719, -0.05513763427734375, -0.04741096496582031, -0.039684295654296875, -0.03195762634277344, -0.02423095703125, -0.016504287719726562, -0.008777618408203125, -0.0010509490966796875, 0.00667572021484375, 0.014402389526367188, 0.022129058837890625, 0.029855728149414062, 0.0375823974609375, 0.04530906677246094, 0.053035736083984375, 0.06076240539550781, 0.06848907470703125, 0.07621574401855469, 0.08394241333007812, 0.09166908264160156, 0.099395751953125, 0.10712242126464844, 0.11484909057617188, 0.12257575988769531, 0.13030242919921875, 0.1380290985107422, 0.14575576782226562, 0.15348243713378906, 0.1612091064453125, 0.16893577575683594, 0.17666244506835938, 0.1843891143798828, 0.19211578369140625, 0.1998424530029297, 0.20756912231445312, 0.21529579162597656, 0.2230224609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 13.0, 25.0, 21.0, 31.0, 49.0, 59.0, 67.0, 75.0, 68.0, 72.0, 74.0, 74.0, 77.0, 61.0, 48.0, 40.0, 38.0, 22.0, 22.0, 13.0, 6.0, 7.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14284706115722656, -0.13737869262695312, -0.1319103240966797, -0.12644195556640625, -0.12097358703613281, -0.11550521850585938, -0.11003684997558594, -0.1045684814453125, -0.09910011291503906, -0.09363174438476562, -0.08816337585449219, -0.08269500732421875, -0.07722663879394531, -0.07175827026367188, -0.06628990173339844, -0.060821533203125, -0.05535316467285156, -0.049884796142578125, -0.04441642761230469, -0.03894805908203125, -0.03347969055175781, -0.028011322021484375, -0.022542953491210938, -0.0170745849609375, -0.011606216430664062, -0.006137847900390625, -0.0006694793701171875, 0.00479888916015625, 0.010267257690429688, 0.015735626220703125, 0.021203994750976562, 0.02667236328125, 0.03214073181152344, 0.037609100341796875, 0.04307746887207031, 0.04854583740234375, 0.05401420593261719, 0.059482574462890625, 0.06495094299316406, 0.0704193115234375, 0.07588768005371094, 0.08135604858398438, 0.08682441711425781, 0.09229278564453125, 0.09776115417480469, 0.10322952270507812, 0.10869789123535156, 0.114166259765625, 0.11963462829589844, 0.12510299682617188, 0.1305713653564453, 0.13603973388671875, 0.1415081024169922, 0.14697647094726562, 0.15244483947753906, 0.1579132080078125, 0.16338157653808594, 0.16884994506835938, 0.1743183135986328, 0.17978668212890625, 0.1852550506591797, 0.19072341918945312, 0.19619178771972656, 0.20166015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 6.0, 15.0, 10.0, 22.0, 24.0, 31.0, 61.0, 72.0, 105.0, 165.0, 270.0, 506.0, 891.0, 1866.0, 5557.0, 26486.0, 286020.0, 668721.0, 45120.0, 7676.0, 2335.0, 1062.0, 558.0, 306.0, 201.0, 137.0, 89.0, 76.0, 46.0, 32.0, 17.0, 13.0, 10.0, 7.0, 9.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4095039367675781, -0.39591217041015625, -0.3823204040527344, -0.3687286376953125, -0.3551368713378906, -0.34154510498046875, -0.3279533386230469, -0.314361572265625, -0.3007698059082031, -0.28717803955078125, -0.2735862731933594, -0.2599945068359375, -0.24640274047851562, -0.23281097412109375, -0.21921920776367188, -0.20562744140625, -0.19203567504882812, -0.17844390869140625, -0.16485214233398438, -0.1512603759765625, -0.13766860961914062, -0.12407684326171875, -0.11048507690429688, -0.096893310546875, -0.08330154418945312, -0.06970977783203125, -0.056118011474609375, -0.0425262451171875, -0.028934478759765625, -0.01534271240234375, -0.001750946044921875, 0.0118408203125, 0.025432586669921875, 0.03902435302734375, 0.052616119384765625, 0.0662078857421875, 0.07979965209960938, 0.09339141845703125, 0.10698318481445312, 0.120574951171875, 0.13416671752929688, 0.14775848388671875, 0.16135025024414062, 0.1749420166015625, 0.18853378295898438, 0.20212554931640625, 0.21571731567382812, 0.22930908203125, 0.24290084838867188, 0.25649261474609375, 0.2700843811035156, 0.2836761474609375, 0.2972679138183594, 0.31085968017578125, 0.3244514465332031, 0.338043212890625, 0.3516349792480469, 0.36522674560546875, 0.3788185119628906, 0.3924102783203125, 0.4060020446777344, 0.41959381103515625, 0.4331855773925781, 0.44677734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 16.0, 19.0, 21.0, 25.0, 21.0, 48.0, 57.0, 55.0, 45.0, 80.0, 59.0, 71.0, 80.0, 45.0, 51.0, 61.0, 48.0, 36.0, 26.0, 27.0, 25.0, 21.0, 17.0, 11.0, 9.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4671974182128906, -0.44831085205078125, -0.4294242858886719, -0.4105377197265625, -0.3916511535644531, -0.37276458740234375, -0.3538780212402344, -0.334991455078125, -0.3161048889160156, -0.29721832275390625, -0.2783317565917969, -0.2594451904296875, -0.24055862426757812, -0.22167205810546875, -0.20278549194335938, -0.18389892578125, -0.16501235961914062, -0.14612579345703125, -0.12723922729492188, -0.1083526611328125, -0.08946609497070312, -0.07057952880859375, -0.051692962646484375, -0.032806396484375, -0.013919830322265625, 0.00496673583984375, 0.023853302001953125, 0.0427398681640625, 0.061626434326171875, 0.08051300048828125, 0.09939956665039062, 0.1182861328125, 0.13717269897460938, 0.15605926513671875, 0.17494583129882812, 0.1938323974609375, 0.21271896362304688, 0.23160552978515625, 0.2504920959472656, 0.269378662109375, 0.2882652282714844, 0.30715179443359375, 0.3260383605957031, 0.3449249267578125, 0.3638114929199219, 0.38269805908203125, 0.4015846252441406, 0.42047119140625, 0.4393577575683594, 0.45824432373046875, 0.4771308898925781, 0.4960174560546875, 0.5149040222167969, 0.5337905883789062, 0.5526771545410156, 0.571563720703125, 0.5904502868652344, 0.6093368530273438, 0.6282234191894531, 0.6471099853515625, 0.6659965515136719, 0.6848831176757812, 0.7037696838378906, 0.72265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 6.0, 23.0, 44.0, 97.0, 174.0, 544.0, 2628.0, 50433.0, 958496.0, 33275.0, 2008.0, 483.0, 172.0, 60.0, 41.0, 20.0, 15.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6201171875, -0.6055068969726562, -0.5908966064453125, -0.5762863159179688, -0.561676025390625, -0.5470657348632812, -0.5324554443359375, -0.5178451538085938, -0.50323486328125, -0.48862457275390625, -0.4740142822265625, -0.45940399169921875, -0.444793701171875, -0.43018341064453125, -0.4155731201171875, -0.40096282958984375, -0.3863525390625, -0.37174224853515625, -0.3571319580078125, -0.34252166748046875, -0.327911376953125, -0.31330108642578125, -0.2986907958984375, -0.28408050537109375, -0.26947021484375, -0.25485992431640625, -0.2402496337890625, -0.22563934326171875, -0.211029052734375, -0.19641876220703125, -0.1818084716796875, -0.16719818115234375, -0.152587890625, -0.13797760009765625, -0.1233673095703125, -0.10875701904296875, -0.094146728515625, -0.07953643798828125, -0.0649261474609375, -0.05031585693359375, -0.03570556640625, -0.02109527587890625, -0.0064849853515625, 0.00812530517578125, 0.022735595703125, 0.03734588623046875, 0.0519561767578125, 0.06656646728515625, 0.0811767578125, 0.09578704833984375, 0.1103973388671875, 0.12500762939453125, 0.139617919921875, 0.15422821044921875, 0.1688385009765625, 0.18344879150390625, 0.19805908203125, 0.21266937255859375, 0.2272796630859375, 0.24188995361328125, 0.256500244140625, 0.27111053466796875, 0.2857208251953125, 0.30033111572265625, 0.31494140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 8.0, 12.0, 19.0, 19.0, 24.0, 34.0, 53.0, 81.0, 101.0, 100.0, 97.0, 94.0, 76.0, 50.0, 34.0, 36.0, 24.0, 14.0, 22.0, 16.0, 6.0, 8.0, 3.0, 8.0, 3.0, 5.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-05, -6.000697612762451e-05, -5.8025121688842773e-05, -5.6043267250061035e-05, -5.40614128112793e-05, -5.207955837249756e-05, -5.009770393371582e-05, -4.811584949493408e-05, -4.6133995056152344e-05, -4.4152140617370605e-05, -4.217028617858887e-05, -4.018843173980713e-05, -3.820657730102539e-05, -3.622472286224365e-05, -3.4242868423461914e-05, -3.2261013984680176e-05, -3.0279159545898438e-05, -2.82973051071167e-05, -2.631545066833496e-05, -2.4333596229553223e-05, -2.2351741790771484e-05, -2.0369887351989746e-05, -1.8388032913208008e-05, -1.640617847442627e-05, -1.4424324035644531e-05, -1.2442469596862793e-05, -1.0460615158081055e-05, -8.478760719299316e-06, -6.496906280517578e-06, -4.51505184173584e-06, -2.5331974029541016e-06, -5.513429641723633e-07, 1.430511474609375e-06, 3.4123659133911133e-06, 5.3942203521728516e-06, 7.37607479095459e-06, 9.357929229736328e-06, 1.1339783668518066e-05, 1.3321638107299805e-05, 1.5303492546081543e-05, 1.728534698486328e-05, 1.926720142364502e-05, 2.1249055862426758e-05, 2.3230910301208496e-05, 2.5212764739990234e-05, 2.7194619178771973e-05, 2.917647361755371e-05, 3.115832805633545e-05, 3.314018249511719e-05, 3.5122036933898926e-05, 3.7103891372680664e-05, 3.90857458114624e-05, 4.106760025024414e-05, 4.304945468902588e-05, 4.503130912780762e-05, 4.7013163566589355e-05, 4.8995018005371094e-05, 5.097687244415283e-05, 5.295872688293457e-05, 5.494058132171631e-05, 5.692243576049805e-05, 5.8904290199279785e-05, 6.0886144638061523e-05, 6.286799907684326e-05, 6.4849853515625e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 4.0, 12.0, 15.0, 15.0, 23.0, 28.0, 52.0, 72.0, 94.0, 156.0, 220.0, 343.0, 580.0, 1074.0, 2370.0, 6193.0, 19751.0, 81089.0, 677399.0, 203977.0, 37442.0, 10432.0, 3570.0, 1599.0, 712.0, 438.0, 283.0, 194.0, 129.0, 85.0, 61.0, 46.0, 19.0, 19.0, 21.0, 16.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1519775390625, -0.14703369140625, -0.14208984375, -0.13714599609375, -0.1322021484375, -0.12725830078125, -0.122314453125, -0.11737060546875, -0.1124267578125, -0.10748291015625, -0.1025390625, -0.09759521484375, -0.0926513671875, -0.08770751953125, -0.082763671875, -0.07781982421875, -0.0728759765625, -0.06793212890625, -0.06298828125, -0.05804443359375, -0.0531005859375, -0.04815673828125, -0.043212890625, -0.03826904296875, -0.0333251953125, -0.02838134765625, -0.0234375, -0.01849365234375, -0.0135498046875, -0.00860595703125, -0.003662109375, 0.00128173828125, 0.0062255859375, 0.01116943359375, 0.01611328125, 0.02105712890625, 0.0260009765625, 0.03094482421875, 0.035888671875, 0.04083251953125, 0.0457763671875, 0.05072021484375, 0.0556640625, 0.06060791015625, 0.0655517578125, 0.07049560546875, 0.075439453125, 0.08038330078125, 0.0853271484375, 0.09027099609375, 0.09521484375, 0.10015869140625, 0.1051025390625, 0.11004638671875, 0.114990234375, 0.11993408203125, 0.1248779296875, 0.12982177734375, 0.134765625, 0.13970947265625, 0.1446533203125, 0.14959716796875, 0.154541015625, 0.15948486328125, 0.1644287109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 9.0, 7.0, 9.0, 12.0, 9.0, 15.0, 24.0, 34.0, 39.0, 57.0, 65.0, 108.0, 107.0, 115.0, 97.0, 65.0, 46.0, 43.0, 29.0, 32.0, 12.0, 10.0, 16.0, 8.0, 5.0, 13.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.123291015625, -0.11816596984863281, -0.11304092407226562, -0.10791587829589844, -0.10279083251953125, -0.09766578674316406, -0.09254074096679688, -0.08741569519042969, -0.0822906494140625, -0.07716560363769531, -0.07204055786132812, -0.06691551208496094, -0.06179046630859375, -0.05666542053222656, -0.051540374755859375, -0.04641532897949219, -0.041290283203125, -0.03616523742675781, -0.031040191650390625, -0.025915145874023438, -0.02079010009765625, -0.015665054321289062, -0.010540008544921875, -0.0054149627685546875, -0.0002899169921875, 0.0048351287841796875, 0.009960174560546875, 0.015085220336914062, 0.02021026611328125, 0.025335311889648438, 0.030460357666015625, 0.03558540344238281, 0.04071044921875, 0.04583549499511719, 0.050960540771484375, 0.05608558654785156, 0.06121063232421875, 0.06633567810058594, 0.07146072387695312, 0.07658576965332031, 0.0817108154296875, 0.08683586120605469, 0.09196090698242188, 0.09708595275878906, 0.10221099853515625, 0.10733604431152344, 0.11246109008789062, 0.11758613586425781, 0.122711181640625, 0.1278362274169922, 0.13296127319335938, 0.13808631896972656, 0.14321136474609375, 0.14833641052246094, 0.15346145629882812, 0.1585865020751953, 0.1637115478515625, 0.1688365936279297, 0.17396163940429688, 0.17908668518066406, 0.18421173095703125, 0.18933677673339844, 0.19446182250976562, 0.1995868682861328, 0.2047119140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 9.0, 15.0, 55.0, 165.0, 467.0, 205.0, 57.0, 14.0, 8.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4672179222106934, -3.280125856399536, -3.0930335521698, -2.9059414863586426, -2.7188491821289062, -2.531757116317749, -2.344665050506592, -2.1575727462768555, -1.9704806804656982, -1.7833884954452515, -1.5962963104248047, -1.4092042446136475, -1.2221120595932007, -1.035019874572754, -0.8479278087615967, -0.6608356237411499, -0.4737434387207031, -0.28665128350257874, -0.09955912828445435, 0.08753299713134766, 0.27462518215179443, 0.4617173671722412, 0.6488094329833984, 0.8359016180038452, 1.022993803024292, 1.2100859880447388, 1.3971781730651855, 1.5842702388763428, 1.7713624238967896, 1.9584546089172363, 2.1455466747283936, 2.332638740539551, 2.519730567932129, 2.706822633743286, 2.8939149379730225, 3.0810070037841797, 3.268099308013916, 3.4551913738250732, 3.6422834396362305, 3.829375743865967, 4.016468048095703, 4.2035603523254395, 4.390652179718018, 4.577744483947754, 4.76483678817749, 4.951929092407227, 5.139020919799805, 5.326113224029541, 5.513205051422119, 5.7002973556518555, 5.887389183044434, 6.07448148727417, 6.261573791503906, 6.448665618896484, 6.635757923126221, 6.822850227355957, 7.009942054748535, 7.1970343589782715, 7.38412618637085, 7.571218490600586, 7.758310794830322, 7.945403099060059, 8.132494926452637, 8.319586753845215, 8.50667953491211]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 3.0, 8.0, 5.0, 13.0, 14.0, 15.0, 11.0, 16.0, 19.0, 21.0, 25.0, 28.0, 31.0, 28.0, 37.0, 43.0, 58.0, 55.0, 57.0, 82.0, 41.0, 46.0, 37.0, 34.0, 33.0, 32.0, 24.0, 30.0, 19.0, 15.0, 19.0, 14.0, 10.0, 18.0, 7.0, 8.0, 6.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5590248107910156, -1.507304072380066, -1.4555834531784058, -1.403862714767456, -1.352142095565796, -1.3004213571548462, -1.2487006187438965, -1.1969799995422363, -1.1452593803405762, -1.0935386419296265, -1.0418180227279663, -0.9900972843170166, -0.9383766651153564, -0.8866559267044067, -0.8349352478981018, -0.7832145690917969, -0.7314938306808472, -0.6797731518745422, -0.6280524730682373, -0.5763317346572876, -0.5246111154556274, -0.4728904068470001, -0.4211696982383728, -0.36944901943206787, -0.31772834062576294, -0.266007661819458, -0.21428696811199188, -0.16256627440452576, -0.11084559559822083, -0.059124916791915894, -0.007404208183288574, 0.04431647062301636, 0.09603714942932129, 0.14775782823562622, 0.19947852194309235, 0.25119921565055847, 0.3029198944568634, 0.35464057326316833, 0.40636128187179565, 0.4580819606781006, 0.5098026394844055, 0.5615233182907104, 0.6132439970970154, 0.6649646759033203, 0.71668541431427, 0.7684060335159302, 0.8201267719268799, 0.8718474507331848, 0.9235681295394897, 0.9752888083457947, 1.0270094871520996, 1.0787302255630493, 1.1304508447647095, 1.1821715831756592, 1.2338922023773193, 1.285612940788269, 1.3373336791992188, 1.3890544176101685, 1.4407750368118286, 1.4924957752227783, 1.5442163944244385, 1.5959371328353882, 1.647657871246338, 1.699378490447998, 1.7510991096496582]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 17.0, 16.0, 37.0, 55.0, 105.0, 170.0, 332.0, 665.0, 1815.0, 6036.0, 35722.0, 1005313.0, 3039226.0, 89888.0, 10249.0, 2735.0, 968.0, 422.0, 207.0, 105.0, 73.0, 35.0, 23.0, 19.0, 13.0, 5.0, 8.0, 1.0, 3.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.19788551330566406, -0.18935012817382812, -0.1808147430419922, -0.17227935791015625, -0.1637439727783203, -0.15520858764648438, -0.14667320251464844, -0.1381378173828125, -0.12960243225097656, -0.12106704711914062, -0.11253166198730469, -0.10399627685546875, -0.09546089172363281, -0.08692550659179688, -0.07839012145996094, -0.069854736328125, -0.06131935119628906, -0.052783966064453125, -0.04424858093261719, -0.03571319580078125, -0.027177810668945312, -0.018642425537109375, -0.010107040405273438, -0.0015716552734375, 0.0069637298583984375, 0.015499114990234375, 0.024034500122070312, 0.03256988525390625, 0.04110527038574219, 0.049640655517578125, 0.05817604064941406, 0.06671142578125, 0.07524681091308594, 0.08378219604492188, 0.09231758117675781, 0.10085296630859375, 0.10938835144042969, 0.11792373657226562, 0.12645912170410156, 0.1349945068359375, 0.14352989196777344, 0.15206527709960938, 0.1606006622314453, 0.16913604736328125, 0.1776714324951172, 0.18620681762695312, 0.19474220275878906, 0.203277587890625, 0.21181297302246094, 0.22034835815429688, 0.2288837432861328, 0.23741912841796875, 0.2459545135498047, 0.2544898986816406, 0.26302528381347656, 0.2715606689453125, 0.28009605407714844, 0.2886314392089844, 0.2971668243408203, 0.30570220947265625, 0.3142375946044922, 0.3227729797363281, 0.33130836486816406, 0.33984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 16.0, 22.0, 23.0, 28.0, 35.0, 45.0, 68.0, 68.0, 75.0, 88.0, 90.0, 56.0, 61.0, 66.0, 60.0, 49.0, 32.0, 29.0, 14.0, 18.0, 15.0, 8.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1324462890625, -0.12719345092773438, -0.12194061279296875, -0.11668777465820312, -0.1114349365234375, -0.10618209838867188, -0.10092926025390625, -0.09567642211914062, -0.090423583984375, -0.08517074584960938, -0.07991790771484375, -0.07466506958007812, -0.0694122314453125, -0.06415939331054688, -0.05890655517578125, -0.053653717041015625, -0.04840087890625, -0.043148040771484375, -0.03789520263671875, -0.032642364501953125, -0.0273895263671875, -0.022136688232421875, -0.01688385009765625, -0.011631011962890625, -0.006378173828125, -0.001125335693359375, 0.00412750244140625, 0.009380340576171875, 0.0146331787109375, 0.019886016845703125, 0.02513885498046875, 0.030391693115234375, 0.03564453125, 0.040897369384765625, 0.04615020751953125, 0.051403045654296875, 0.0566558837890625, 0.061908721923828125, 0.06716156005859375, 0.07241439819335938, 0.077667236328125, 0.08292007446289062, 0.08817291259765625, 0.09342575073242188, 0.0986785888671875, 0.10393142700195312, 0.10918426513671875, 0.11443710327148438, 0.11968994140625, 0.12494277954101562, 0.13019561767578125, 0.13544845581054688, 0.1407012939453125, 0.14595413208007812, 0.15120697021484375, 0.15645980834960938, 0.161712646484375, 0.16696548461914062, 0.17221832275390625, 0.17747116088867188, 0.1827239990234375, 0.18797683715820312, 0.19322967529296875, 0.19848251342773438, 0.2037353515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 13.0, 24.0, 35.0, 46.0, 103.0, 193.0, 406.0, 1001.0, 3348.0, 16199.0, 416883.0, 3693354.0, 53263.0, 6448.0, 1770.0, 654.0, 272.0, 101.0, 54.0, 43.0, 22.0, 20.0, 4.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37158203125, -0.35794830322265625, -0.3443145751953125, -0.33068084716796875, -0.317047119140625, -0.30341339111328125, -0.2897796630859375, -0.27614593505859375, -0.26251220703125, -0.24887847900390625, -0.2352447509765625, -0.22161102294921875, -0.207977294921875, -0.19434356689453125, -0.1807098388671875, -0.16707611083984375, -0.1534423828125, -0.13980865478515625, -0.1261749267578125, -0.11254119873046875, -0.098907470703125, -0.08527374267578125, -0.0716400146484375, -0.05800628662109375, -0.04437255859375, -0.03073883056640625, -0.0171051025390625, -0.00347137451171875, 0.010162353515625, 0.02379608154296875, 0.0374298095703125, 0.05106353759765625, 0.064697265625, 0.07833099365234375, 0.0919647216796875, 0.10559844970703125, 0.119232177734375, 0.13286590576171875, 0.1464996337890625, 0.16013336181640625, 0.17376708984375, 0.18740081787109375, 0.2010345458984375, 0.21466827392578125, 0.228302001953125, 0.24193572998046875, 0.2555694580078125, 0.26920318603515625, 0.2828369140625, 0.29647064208984375, 0.3101043701171875, 0.32373809814453125, 0.337371826171875, 0.35100555419921875, 0.3646392822265625, 0.37827301025390625, 0.39190673828125, 0.40554046630859375, 0.4191741943359375, 0.43280792236328125, 0.446441650390625, 0.46007537841796875, 0.4737091064453125, 0.48734283447265625, 0.5009765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 21.0, 19.0, 26.0, 54.0, 96.0, 164.0, 343.0, 601.0, 951.0, 824.0, 425.0, 243.0, 127.0, 57.0, 41.0, 12.0, 11.0, 11.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.2948760986328125, -0.285308837890625, -0.2757415771484375, -0.26617431640625, -0.2566070556640625, -0.247039794921875, -0.2374725341796875, -0.2279052734375, -0.2183380126953125, -0.208770751953125, -0.1992034912109375, -0.18963623046875, -0.1800689697265625, -0.170501708984375, -0.1609344482421875, -0.1513671875, -0.1417999267578125, -0.132232666015625, -0.1226654052734375, -0.11309814453125, -0.1035308837890625, -0.093963623046875, -0.0843963623046875, -0.0748291015625, -0.0652618408203125, -0.055694580078125, -0.0461273193359375, -0.03656005859375, -0.0269927978515625, -0.017425537109375, -0.0078582763671875, 0.001708984375, 0.0112762451171875, 0.020843505859375, 0.0304107666015625, 0.03997802734375, 0.0495452880859375, 0.059112548828125, 0.0686798095703125, 0.0782470703125, 0.0878143310546875, 0.097381591796875, 0.1069488525390625, 0.11651611328125, 0.1260833740234375, 0.135650634765625, 0.1452178955078125, 0.15478515625, 0.1643524169921875, 0.173919677734375, 0.1834869384765625, 0.19305419921875, 0.2026214599609375, 0.212188720703125, 0.2217559814453125, 0.2313232421875, 0.2408905029296875, 0.250457763671875, 0.2600250244140625, 0.26959228515625, 0.2791595458984375, 0.288726806640625, 0.2982940673828125, 0.307861328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 6.0, 13.0, 60.0, 187.0, 387.0, 237.0, 67.0, 20.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.243610858917236, -7.094602108001709, -6.94559383392334, -6.7965850830078125, -6.647576332092285, -6.498568058013916, -6.349559307098389, -6.2005510330200195, -6.051542282104492, -5.902533531188965, -5.753525257110596, -5.604516506195068, -5.455508232116699, -5.306499481201172, -5.1574907302856445, -5.008481979370117, -4.859473705291748, -4.710464954376221, -4.561456680297852, -4.412447929382324, -4.263439178466797, -4.114430904388428, -3.9654221534729004, -3.816413640975952, -3.667405128479004, -3.5183966159820557, -3.3693881034851074, -3.22037935256958, -3.071370840072632, -2.9223623275756836, -2.7733535766601562, -2.624345064163208, -2.4753365516662598, -2.3263280391693115, -2.1773195266723633, -2.028310775756836, -1.8793022632598877, -1.7302937507629395, -1.5812851190567017, -1.4322764873504639, -1.2832679748535156, -1.1342594623565674, -0.9852508306503296, -0.8362422585487366, -0.6872336864471436, -0.5382251143455505, -0.3892165422439575, -0.24020791053771973, -0.09119939804077148, 0.05780917406082153, 0.20681774616241455, 0.35582631826400757, 0.5048348903656006, 0.6538434624671936, 0.8028520345687866, 0.9518606662750244, 1.1008691787719727, 1.249877691268921, 1.3988863229751587, 1.5478949546813965, 1.6969034671783447, 1.845911979675293, 1.9949206113815308, 2.1439292430877686, 2.292937755584717]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 12.0, 10.0, 17.0, 24.0, 23.0, 22.0, 15.0, 28.0, 41.0, 51.0, 42.0, 49.0, 52.0, 49.0, 58.0, 54.0, 59.0, 51.0, 56.0, 60.0, 36.0, 26.0, 39.0, 28.0, 20.0, 22.0, 12.0, 8.0, 10.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.3525437116622925, -1.3168846368789673, -1.2812256813049316, -1.2455666065216064, -1.2099075317382812, -1.174248456954956, -1.1385895013809204, -1.1029304265975952, -1.0672714710235596, -1.0316123962402344, -0.995953381061554, -0.9602943658828735, -0.9246352910995483, -0.8889762759208679, -0.8533172607421875, -0.8176581859588623, -0.7819991111755371, -0.7463400959968567, -0.7106810212135315, -0.6750220060348511, -0.6393629312515259, -0.6037039160728455, -0.568044900894165, -0.5323858261108398, -0.4967268109321594, -0.4610677659511566, -0.4254087209701538, -0.3897497057914734, -0.3540906608104706, -0.3184316158294678, -0.28277260065078735, -0.24711355566978455, -0.2114545702934265, -0.1757955253124237, -0.1401364952325821, -0.10447745770215988, -0.06881842017173767, -0.03315937519073486, 0.0024996548891067505, 0.038158684968948364, 0.07381772994995117, 0.10947676748037338, 0.1451358050107956, 0.1807948350906372, 0.21645388007164001, 0.2521129250526428, 0.28777194023132324, 0.32343098521232605, 0.35909003019332886, 0.39474907517433167, 0.4304081201553345, 0.4660671353340149, 0.5017261505126953, 0.5373852252960205, 0.5730442404747009, 0.6087032556533813, 0.6443623304367065, 0.680021345615387, 0.7156804203987122, 0.7513394355773926, 0.7869985103607178, 0.8226575255393982, 0.8583165407180786, 0.8939756155014038, 0.9296346306800842]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 6.0, 9.0, 13.0, 13.0, 30.0, 38.0, 42.0, 62.0, 119.0, 174.0, 300.0, 535.0, 997.0, 2067.0, 4803.0, 12622.0, 39549.0, 158708.0, 459028.0, 270080.0, 67153.0, 19480.0, 6765.0, 2939.0, 1323.0, 696.0, 394.0, 204.0, 118.0, 97.0, 45.0, 39.0, 20.0, 20.0, 13.0, 21.0, 4.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.17241668701171875, -0.1666107177734375, -0.16080474853515625, -0.154998779296875, -0.14919281005859375, -0.1433868408203125, -0.13758087158203125, -0.13177490234375, -0.12596893310546875, -0.1201629638671875, -0.11435699462890625, -0.108551025390625, -0.10274505615234375, -0.0969390869140625, -0.09113311767578125, -0.0853271484375, -0.07952117919921875, -0.0737152099609375, -0.06790924072265625, -0.062103271484375, -0.05629730224609375, -0.0504913330078125, -0.04468536376953125, -0.03887939453125, -0.03307342529296875, -0.0272674560546875, -0.02146148681640625, -0.015655517578125, -0.00984954833984375, -0.0040435791015625, 0.00176239013671875, 0.007568359375, 0.01337432861328125, 0.0191802978515625, 0.02498626708984375, 0.030792236328125, 0.03659820556640625, 0.0424041748046875, 0.04821014404296875, 0.05401611328125, 0.05982208251953125, 0.0656280517578125, 0.07143402099609375, 0.077239990234375, 0.08304595947265625, 0.0888519287109375, 0.09465789794921875, 0.1004638671875, 0.10626983642578125, 0.1120758056640625, 0.11788177490234375, 0.123687744140625, 0.12949371337890625, 0.1352996826171875, 0.14110565185546875, 0.14691162109375, 0.15271759033203125, 0.1585235595703125, 0.16432952880859375, 0.170135498046875, 0.17594146728515625, 0.1817474365234375, 0.18755340576171875, 0.193359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 14.0, 15.0, 25.0, 31.0, 26.0, 45.0, 54.0, 50.0, 78.0, 65.0, 86.0, 60.0, 64.0, 81.0, 55.0, 45.0, 45.0, 40.0, 23.0, 16.0, 18.0, 15.0, 7.0, 9.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.13736724853515625, -0.1322784423828125, -0.12718963623046875, -0.122100830078125, -0.11701202392578125, -0.1119232177734375, -0.10683441162109375, -0.10174560546875, -0.09665679931640625, -0.0915679931640625, -0.08647918701171875, -0.081390380859375, -0.07630157470703125, -0.0712127685546875, -0.06612396240234375, -0.06103515625, -0.05594635009765625, -0.0508575439453125, -0.04576873779296875, -0.040679931640625, -0.03559112548828125, -0.0305023193359375, -0.02541351318359375, -0.02032470703125, -0.01523590087890625, -0.0101470947265625, -0.00505828857421875, 3.0517578125e-05, 0.00511932373046875, 0.0102081298828125, 0.01529693603515625, 0.0203857421875, 0.02547454833984375, 0.0305633544921875, 0.03565216064453125, 0.040740966796875, 0.04582977294921875, 0.0509185791015625, 0.05600738525390625, 0.06109619140625, 0.06618499755859375, 0.0712738037109375, 0.07636260986328125, 0.081451416015625, 0.08654022216796875, 0.0916290283203125, 0.09671783447265625, 0.101806640625, 0.10689544677734375, 0.1119842529296875, 0.11707305908203125, 0.122161865234375, 0.12725067138671875, 0.1323394775390625, 0.13742828369140625, 0.14251708984375, 0.14760589599609375, 0.1526947021484375, 0.15778350830078125, 0.162872314453125, 0.16796112060546875, 0.1730499267578125, 0.17813873291015625, 0.1832275390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 7.0, 5.0, 9.0, 9.0, 23.0, 27.0, 37.0, 36.0, 58.0, 94.0, 165.0, 272.0, 797.0, 2630.0, 13688.0, 134983.0, 774224.0, 106507.0, 11251.0, 2291.0, 707.0, 284.0, 152.0, 93.0, 54.0, 35.0, 34.0, 12.0, 20.0, 15.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2974090576171875, -0.286956787109375, -0.2765045166015625, -0.26605224609375, -0.2555999755859375, -0.245147705078125, -0.2346954345703125, -0.2242431640625, -0.2137908935546875, -0.203338623046875, -0.1928863525390625, -0.18243408203125, -0.1719818115234375, -0.161529541015625, -0.1510772705078125, -0.140625, -0.1301727294921875, -0.119720458984375, -0.1092681884765625, -0.09881591796875, -0.0883636474609375, -0.077911376953125, -0.0674591064453125, -0.0570068359375, -0.0465545654296875, -0.036102294921875, -0.0256500244140625, -0.01519775390625, -0.0047454833984375, 0.005706787109375, 0.0161590576171875, 0.026611328125, 0.0370635986328125, 0.047515869140625, 0.0579681396484375, 0.06842041015625, 0.0788726806640625, 0.089324951171875, 0.0997772216796875, 0.1102294921875, 0.1206817626953125, 0.131134033203125, 0.1415863037109375, 0.15203857421875, 0.1624908447265625, 0.172943115234375, 0.1833953857421875, 0.19384765625, 0.2042999267578125, 0.214752197265625, 0.2252044677734375, 0.23565673828125, 0.2461090087890625, 0.256561279296875, 0.2670135498046875, 0.2774658203125, 0.2879180908203125, 0.298370361328125, 0.3088226318359375, 0.31927490234375, 0.3297271728515625, 0.340179443359375, 0.3506317138671875, 0.361083984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 8.0, 2.0, 6.0, 8.0, 15.0, 18.0, 13.0, 23.0, 32.0, 38.0, 50.0, 47.0, 51.0, 61.0, 64.0, 60.0, 67.0, 63.0, 54.0, 50.0, 57.0, 45.0, 31.0, 30.0, 24.0, 24.0, 10.0, 16.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6083984375, -0.5923042297363281, -0.5762100219726562, -0.5601158142089844, -0.5440216064453125, -0.5279273986816406, -0.5118331909179688, -0.4957389831542969, -0.479644775390625, -0.4635505676269531, -0.44745635986328125, -0.4313621520996094, -0.4152679443359375, -0.3991737365722656, -0.38307952880859375, -0.3669853210449219, -0.35089111328125, -0.3347969055175781, -0.31870269775390625, -0.3026084899902344, -0.2865142822265625, -0.2704200744628906, -0.25432586669921875, -0.23823165893554688, -0.222137451171875, -0.20604324340820312, -0.18994903564453125, -0.17385482788085938, -0.1577606201171875, -0.14166641235351562, -0.12557220458984375, -0.10947799682617188, -0.0933837890625, -0.07728958129882812, -0.06119537353515625, -0.045101165771484375, -0.0290069580078125, -0.012912750244140625, 0.00318145751953125, 0.019275665283203125, 0.035369873046875, 0.051464080810546875, 0.06755828857421875, 0.08365249633789062, 0.0997467041015625, 0.11584091186523438, 0.13193511962890625, 0.14802932739257812, 0.16412353515625, 0.18021774291992188, 0.19631195068359375, 0.21240615844726562, 0.2285003662109375, 0.24459457397460938, 0.26068878173828125, 0.2767829895019531, 0.292877197265625, 0.3089714050292969, 0.32506561279296875, 0.3411598205566406, 0.3572540283203125, 0.3733482360839844, 0.38944244384765625, 0.4055366516113281, 0.421630859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 9.0, 23.0, 27.0, 49.0, 108.0, 216.0, 465.0, 1297.0, 3594.0, 12631.0, 68362.0, 691539.0, 228927.0, 30385.0, 7082.0, 2299.0, 881.0, 331.0, 157.0, 69.0, 34.0, 23.0, 13.0, 12.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1326904296875, -0.12851524353027344, -0.12434005737304688, -0.12016487121582031, -0.11598968505859375, -0.11181449890136719, -0.10763931274414062, -0.10346412658691406, -0.0992889404296875, -0.09511375427246094, -0.09093856811523438, -0.08676338195800781, -0.08258819580078125, -0.07841300964355469, -0.07423782348632812, -0.07006263732910156, -0.065887451171875, -0.06171226501464844, -0.057537078857421875, -0.05336189270019531, -0.04918670654296875, -0.04501152038574219, -0.040836334228515625, -0.03666114807128906, -0.0324859619140625, -0.028310775756835938, -0.024135589599609375, -0.019960403442382812, -0.01578521728515625, -0.011610031127929688, -0.007434844970703125, -0.0032596588134765625, 0.00091552734375, 0.0050907135009765625, 0.009265899658203125, 0.013441085815429688, 0.01761627197265625, 0.021791458129882812, 0.025966644287109375, 0.030141830444335938, 0.0343170166015625, 0.03849220275878906, 0.042667388916015625, 0.04684257507324219, 0.05101776123046875, 0.05519294738769531, 0.059368133544921875, 0.06354331970214844, 0.067718505859375, 0.07189369201660156, 0.07606887817382812, 0.08024406433105469, 0.08441925048828125, 0.08859443664550781, 0.09276962280273438, 0.09694480895996094, 0.1011199951171875, 0.10529518127441406, 0.10947036743164062, 0.11364555358886719, 0.11782073974609375, 0.12199592590332031, 0.12617111206054688, 0.13034629821777344, 0.134521484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 3.0, 4.0, 7.0, 5.0, 6.0, 11.0, 9.0, 17.0, 23.0, 26.0, 32.0, 43.0, 58.0, 75.0, 81.0, 87.0, 110.0, 88.0, 70.0, 60.0, 52.0, 44.0, 29.0, 13.0, 15.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.112720489501953e-05, -3.980565816164017e-05, -3.84841114282608e-05, -3.716256469488144e-05, -3.5841017961502075e-05, -3.451947122812271e-05, -3.319792449474335e-05, -3.187637776136398e-05, -3.055483102798462e-05, -2.9233284294605255e-05, -2.791173756122589e-05, -2.6590190827846527e-05, -2.5268644094467163e-05, -2.39470973610878e-05, -2.2625550627708435e-05, -2.130400389432907e-05, -1.9982457160949707e-05, -1.8660910427570343e-05, -1.733936369419098e-05, -1.6017816960811615e-05, -1.4696270227432251e-05, -1.3374723494052887e-05, -1.2053176760673523e-05, -1.0731630027294159e-05, -9.410083293914795e-06, -8.088536560535431e-06, -6.766989827156067e-06, -5.445443093776703e-06, -4.123896360397339e-06, -2.802349627017975e-06, -1.4808028936386108e-06, -1.5925616025924683e-07, 1.1622905731201172e-06, 2.483837306499481e-06, 3.8053840398788452e-06, 5.126930773258209e-06, 6.448477506637573e-06, 7.770024240016937e-06, 9.091570973396301e-06, 1.0413117706775665e-05, 1.173466444015503e-05, 1.3056211173534393e-05, 1.4377757906913757e-05, 1.569930464029312e-05, 1.7020851373672485e-05, 1.834239810705185e-05, 1.9663944840431213e-05, 2.0985491573810577e-05, 2.230703830718994e-05, 2.3628585040569305e-05, 2.495013177394867e-05, 2.6271678507328033e-05, 2.7593225240707397e-05, 2.891477197408676e-05, 3.0236318707466125e-05, 3.155786544084549e-05, 3.2879412174224854e-05, 3.420095890760422e-05, 3.552250564098358e-05, 3.6844052374362946e-05, 3.816559910774231e-05, 3.9487145841121674e-05, 4.080869257450104e-05, 4.21302393078804e-05, 4.3451786041259766e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 11.0, 16.0, 14.0, 27.0, 37.0, 42.0, 87.0, 114.0, 193.0, 302.0, 539.0, 941.0, 1704.0, 3545.0, 7512.0, 18110.0, 53544.0, 193757.0, 569166.0, 134005.0, 38552.0, 14109.0, 5887.0, 2816.0, 1504.0, 778.0, 421.0, 268.0, 169.0, 93.0, 81.0, 45.0, 33.0, 34.0, 17.0, 19.0, 11.0, 12.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07381343841552734, -0.07121086120605469, -0.06860828399658203, -0.06600570678710938, -0.06340312957763672, -0.06080055236816406, -0.058197975158691406, -0.05559539794921875, -0.052992820739746094, -0.05039024353027344, -0.04778766632080078, -0.045185089111328125, -0.04258251190185547, -0.03997993469238281, -0.037377357482910156, -0.0347747802734375, -0.032172203063964844, -0.029569625854492188, -0.02696704864501953, -0.024364471435546875, -0.02176189422607422, -0.019159317016601562, -0.016556739807128906, -0.01395416259765625, -0.011351585388183594, -0.008749008178710938, -0.006146430969238281, -0.003543853759765625, -0.0009412765502929688, 0.0016613006591796875, 0.004263877868652344, 0.006866455078125, 0.009469032287597656, 0.012071609497070312, 0.014674186706542969, 0.017276763916015625, 0.01987934112548828, 0.022481918334960938, 0.025084495544433594, 0.02768707275390625, 0.030289649963378906, 0.03289222717285156, 0.03549480438232422, 0.038097381591796875, 0.04069995880126953, 0.04330253601074219, 0.045905113220214844, 0.0485076904296875, 0.051110267639160156, 0.05371284484863281, 0.05631542205810547, 0.058917999267578125, 0.06152057647705078, 0.06412315368652344, 0.0667257308959961, 0.06932830810546875, 0.0719308853149414, 0.07453346252441406, 0.07713603973388672, 0.07973861694335938, 0.08234119415283203, 0.08494377136230469, 0.08754634857177734, 0.09014892578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 13.0, 17.0, 24.0, 46.0, 58.0, 107.0, 139.0, 156.0, 147.0, 123.0, 58.0, 42.0, 36.0, 9.0, 11.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.274169921875, -0.2684011459350586, -0.2626323699951172, -0.2568635940551758, -0.2510948181152344, -0.24532604217529297, -0.23955726623535156, -0.23378849029541016, -0.22801971435546875, -0.22225093841552734, -0.21648216247558594, -0.21071338653564453, -0.20494461059570312, -0.19917583465576172, -0.1934070587158203, -0.1876382827758789, -0.1818695068359375, -0.1761007308959961, -0.1703319549560547, -0.16456317901611328, -0.15879440307617188, -0.15302562713623047, -0.14725685119628906, -0.14148807525634766, -0.13571929931640625, -0.12995052337646484, -0.12418174743652344, -0.11841297149658203, -0.11264419555664062, -0.10687541961669922, -0.10110664367675781, -0.0953378677368164, -0.089569091796875, -0.0838003158569336, -0.07803153991699219, -0.07226276397705078, -0.06649398803710938, -0.06072521209716797, -0.05495643615722656, -0.049187660217285156, -0.04341888427734375, -0.037650108337402344, -0.03188133239746094, -0.02611255645751953, -0.020343780517578125, -0.014575004577636719, -0.008806228637695312, -0.0030374526977539062, 0.0027313232421875, 0.008500099182128906, 0.014268875122070312, 0.02003765106201172, 0.025806427001953125, 0.03157520294189453, 0.03734397888183594, 0.043112754821777344, 0.04888153076171875, 0.054650306701660156, 0.06041908264160156, 0.06618785858154297, 0.07195663452148438, 0.07772541046142578, 0.08349418640136719, 0.0892629623413086, 0.09503173828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 13.0, 35.0, 98.0, 216.0, 363.0, 138.0, 68.0, 27.0, 10.0, 12.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.572631359100342, -4.467034339904785, -4.361437797546387, -4.25584077835083, -4.150243759155273, -4.044646739959717, -3.9390499591827393, -3.8334531784057617, -3.727856159210205, -3.6222591400146484, -3.516662359237671, -3.4110655784606934, -3.3054685592651367, -3.19987154006958, -3.0942747592926025, -2.988677978515625, -2.8830809593200684, -2.7774839401245117, -2.671887159347534, -2.5662903785705566, -2.460693359375, -2.3550963401794434, -2.249499559402466, -2.1439027786254883, -2.0383057594299316, -1.9327088594436646, -1.8271119594573975, -1.7215150594711304, -1.6159181594848633, -1.5103212594985962, -1.404724359512329, -1.299127459526062, -1.193530559539795, -1.0879336595535278, -0.9823367595672607, -0.8767398595809937, -0.7711429595947266, -0.6655460596084595, -0.5599491596221924, -0.4543522596359253, -0.3487553596496582, -0.2431584596633911, -0.13756155967712402, -0.031964659690856934, 0.07363224029541016, 0.17922914028167725, 0.28482604026794434, 0.3904229402542114, 0.4960198402404785, 0.6016167402267456, 0.7072136402130127, 0.8128105401992798, 0.9184074401855469, 1.024004340171814, 1.129601240158081, 1.2351981401443481, 1.3407950401306152, 1.4463919401168823, 1.5519888401031494, 1.6575857400894165, 1.7631826400756836, 1.8687795400619507, 1.9743764400482178, 2.0799732208251953, 2.185570240020752]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 9.0, 6.0, 8.0, 9.0, 9.0, 9.0, 13.0, 15.0, 20.0, 17.0, 21.0, 29.0, 28.0, 32.0, 39.0, 35.0, 44.0, 73.0, 68.0, 76.0, 70.0, 57.0, 36.0, 36.0, 31.0, 38.0, 32.0, 24.0, 17.0, 17.0, 16.0, 24.0, 10.0, 10.0, 5.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5206475257873535, -1.469054937362671, -1.4174623489379883, -1.3658697605133057, -1.3142770528793335, -1.2626844644546509, -1.2110918760299683, -1.1594992876052856, -1.107906699180603, -1.0563141107559204, -1.0047215223312378, -0.9531288743019104, -0.9015362858772278, -0.8499436378479004, -0.7983510494232178, -0.7467584609985352, -0.6951658129692078, -0.6435732245445251, -0.5919805765151978, -0.5403879880905151, -0.4887953996658325, -0.4372027814388275, -0.3856101632118225, -0.3340175747871399, -0.2824249565601349, -0.23083235323429108, -0.17923974990844727, -0.12764713168144226, -0.07605452835559845, -0.02446192502975464, 0.027130693197250366, 0.07872328162193298, 0.130315899848938, 0.1819085031747818, 0.2335011065006256, 0.2850937247276306, 0.33668631315231323, 0.38827893137931824, 0.43987154960632324, 0.49146413803100586, 0.5430567264556885, 0.5946493148803711, 0.6462419629096985, 0.6978345513343811, 0.7494271397590637, 0.8010197877883911, 0.8526123762130737, 0.9042049646377563, 0.9557976126670837, 1.0073902606964111, 1.0589828491210938, 1.1105754375457764, 1.162168025970459, 1.2137606143951416, 1.2653532028198242, 1.3169457912445068, 1.368538498878479, 1.4201310873031616, 1.4717236757278442, 1.5233163833618164, 1.574908971786499, 1.6265015602111816, 1.6780941486358643, 1.7296867370605469, 1.7812793254852295]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 12.0, 11.0, 18.0, 39.0, 43.0, 71.0, 158.0, 262.0, 479.0, 950.0, 2357.0, 7320.0, 35959.0, 498633.0, 3269213.0, 342220.0, 26948.0, 5647.0, 2049.0, 851.0, 429.0, 251.0, 138.0, 71.0, 43.0, 37.0, 19.0, 19.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15535926818847656, -0.14873123168945312, -0.1421031951904297, -0.13547515869140625, -0.1288471221923828, -0.12221908569335938, -0.11559104919433594, -0.1089630126953125, -0.10233497619628906, -0.09570693969726562, -0.08907890319824219, -0.08245086669921875, -0.07582283020019531, -0.06919479370117188, -0.06256675720214844, -0.055938720703125, -0.04931068420410156, -0.042682647705078125, -0.03605461120605469, -0.02942657470703125, -0.022798538208007812, -0.016170501708984375, -0.009542465209960938, -0.0029144287109375, 0.0037136077880859375, 0.010341644287109375, 0.016969680786132812, 0.02359771728515625, 0.030225753784179688, 0.036853790283203125, 0.04348182678222656, 0.05010986328125, 0.05673789978027344, 0.06336593627929688, 0.06999397277832031, 0.07662200927734375, 0.08325004577636719, 0.08987808227539062, 0.09650611877441406, 0.1031341552734375, 0.10976219177246094, 0.11639022827148438, 0.12301826477050781, 0.12964630126953125, 0.1362743377685547, 0.14290237426757812, 0.14953041076660156, 0.156158447265625, 0.16278648376464844, 0.16941452026367188, 0.1760425567626953, 0.18267059326171875, 0.1892986297607422, 0.19592666625976562, 0.20255470275878906, 0.2091827392578125, 0.21581077575683594, 0.22243881225585938, 0.2290668487548828, 0.23569488525390625, 0.2423229217529297, 0.24895095825195312, 0.25557899475097656, 0.26220703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 11.0, 22.0, 43.0, 31.0, 52.0, 58.0, 71.0, 69.0, 66.0, 81.0, 73.0, 76.0, 59.0, 53.0, 50.0, 48.0, 35.0, 21.0, 14.0, 5.0, 12.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.1405773162841797, -0.13528060913085938, -0.12998390197753906, -0.12468719482421875, -0.11939048767089844, -0.11409378051757812, -0.10879707336425781, -0.1035003662109375, -0.09820365905761719, -0.09290695190429688, -0.08761024475097656, -0.08231353759765625, -0.07701683044433594, -0.07172012329101562, -0.06642341613769531, -0.061126708984375, -0.05583000183105469, -0.050533294677734375, -0.04523658752441406, -0.03993988037109375, -0.03464317321777344, -0.029346466064453125, -0.024049758911132812, -0.0187530517578125, -0.013456344604492188, -0.008159637451171875, -0.0028629302978515625, 0.00243377685546875, 0.0077304840087890625, 0.013027191162109375, 0.018323898315429688, 0.02362060546875, 0.028917312622070312, 0.034214019775390625, 0.03951072692871094, 0.04480743408203125, 0.05010414123535156, 0.055400848388671875, 0.06069755554199219, 0.0659942626953125, 0.07129096984863281, 0.07658767700195312, 0.08188438415527344, 0.08718109130859375, 0.09247779846191406, 0.09777450561523438, 0.10307121276855469, 0.108367919921875, 0.11366462707519531, 0.11896133422851562, 0.12425804138183594, 0.12955474853515625, 0.13485145568847656, 0.14014816284179688, 0.1454448699951172, 0.1507415771484375, 0.1560382843017578, 0.16133499145507812, 0.16663169860839844, 0.17192840576171875, 0.17722511291503906, 0.18252182006835938, 0.1878185272216797, 0.193115234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 11.0, 24.0, 47.0, 68.0, 184.0, 430.0, 1618.0, 40316.0, 4125828.0, 23565.0, 1413.0, 456.0, 167.0, 83.0, 29.0, 15.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7163925170898438, -0.6920623779296875, -0.6677322387695312, -0.643402099609375, -0.6190719604492188, -0.5947418212890625, -0.5704116821289062, -0.54608154296875, -0.5217514038085938, -0.4974212646484375, -0.47309112548828125, -0.448760986328125, -0.42443084716796875, -0.4001007080078125, -0.37577056884765625, -0.3514404296875, -0.32711029052734375, -0.3027801513671875, -0.27845001220703125, -0.254119873046875, -0.22978973388671875, -0.2054595947265625, -0.18112945556640625, -0.15679931640625, -0.13246917724609375, -0.1081390380859375, -0.08380889892578125, -0.059478759765625, -0.03514862060546875, -0.0108184814453125, 0.01351165771484375, 0.037841796875, 0.06217193603515625, 0.0865020751953125, 0.11083221435546875, 0.135162353515625, 0.15949249267578125, 0.1838226318359375, 0.20815277099609375, 0.23248291015625, 0.25681304931640625, 0.2811431884765625, 0.30547332763671875, 0.329803466796875, 0.35413360595703125, 0.3784637451171875, 0.40279388427734375, 0.4271240234375, 0.45145416259765625, 0.4757843017578125, 0.5001144409179688, 0.524444580078125, 0.5487747192382812, 0.5731048583984375, 0.5974349975585938, 0.62176513671875, 0.6460952758789062, 0.6704254150390625, 0.6947555541992188, 0.719085693359375, 0.7434158325195312, 0.7677459716796875, 0.7920761108398438, 0.81640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 2.0, 3.0, 4.0, 3.0, 10.0, 23.0, 25.0, 35.0, 52.0, 96.0, 177.0, 385.0, 684.0, 886.0, 778.0, 386.0, 215.0, 126.0, 60.0, 44.0, 26.0, 13.0, 10.0, 15.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29541015625, -0.2868804931640625, -0.278350830078125, -0.2698211669921875, -0.26129150390625, -0.2527618408203125, -0.244232177734375, -0.2357025146484375, -0.2271728515625, -0.2186431884765625, -0.210113525390625, -0.2015838623046875, -0.19305419921875, -0.1845245361328125, -0.175994873046875, -0.1674652099609375, -0.158935546875, -0.1504058837890625, -0.141876220703125, -0.1333465576171875, -0.12481689453125, -0.1162872314453125, -0.107757568359375, -0.0992279052734375, -0.0906982421875, -0.0821685791015625, -0.073638916015625, -0.0651092529296875, -0.05657958984375, -0.0480499267578125, -0.039520263671875, -0.0309906005859375, -0.0224609375, -0.0139312744140625, -0.005401611328125, 0.0031280517578125, 0.01165771484375, 0.0201873779296875, 0.028717041015625, 0.0372467041015625, 0.0457763671875, 0.0543060302734375, 0.062835693359375, 0.0713653564453125, 0.07989501953125, 0.0884246826171875, 0.096954345703125, 0.1054840087890625, 0.114013671875, 0.1225433349609375, 0.131072998046875, 0.1396026611328125, 0.14813232421875, 0.1566619873046875, 0.165191650390625, 0.1737213134765625, 0.1822509765625, 0.1907806396484375, 0.199310302734375, 0.2078399658203125, 0.21636962890625, 0.2248992919921875, 0.233428955078125, 0.2419586181640625, 0.25048828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 11.0, 18.0, 51.0, 83.0, 187.0, 253.0, 162.0, 118.0, 55.0, 30.0, 19.0, 7.0, 1.0, 0.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142481565475464, -3.0541329383850098, -2.9657845497131348, -2.8774359226226807, -2.7890872955322266, -2.7007386684417725, -2.6123902797698975, -2.5240416526794434, -2.4356930255889893, -2.347344398498535, -2.25899600982666, -2.170647382736206, -2.082298755645752, -1.9939502477645874, -1.9056017398834229, -1.8172531127929688, -1.7289046049118042, -1.6405560970306396, -1.5522074699401855, -1.463858962059021, -1.375510334968567, -1.2871618270874023, -1.1988131999969482, -1.1104646921157837, -1.0221161842346191, -0.9337676167488098, -0.8454190492630005, -0.7570705413818359, -0.6687219142913818, -0.5803734064102173, -0.49202483892440796, -0.40367627143859863, -0.31532764434814453, -0.2269790768623352, -0.13863052427768707, -0.05028197169303894, 0.038066595792770386, 0.1264151632785797, 0.21476370096206665, 0.303112268447876, 0.3914608359336853, 0.47980940341949463, 0.568157970905304, 0.6565065383911133, 0.7448550462722778, 0.8332036733627319, 0.9215521812438965, 1.0099008083343506, 1.0982493162155151, 1.1865978240966797, 1.2749464511871338, 1.3632949590682983, 1.4516435861587524, 1.539992094039917, 1.628340721130371, 1.7166892290115356, 1.8050377368927002, 1.8933862447738647, 1.9817348718643188, 2.0700833797454834, 2.1584320068359375, 2.2467806339263916, 2.3351290225982666, 2.4234776496887207, 2.511826276779175]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 7.0, 11.0, 4.0, 11.0, 17.0, 12.0, 22.0, 19.0, 23.0, 22.0, 25.0, 35.0, 36.0, 29.0, 39.0, 35.0, 47.0, 49.0, 60.0, 50.0, 40.0, 46.0, 44.0, 39.0, 38.0, 30.0, 30.0, 30.0, 24.0, 16.0, 19.0, 10.0, 16.0, 8.0, 13.0, 2.0, 4.0, 9.0, 10.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6873423457145691, -0.661778450012207, -0.6362144947052002, -0.6106505990028381, -0.5850867033004761, -0.5595227479934692, -0.5339588522911072, -0.5083949565887451, -0.4828310012817383, -0.45726707577705383, -0.4317031800746918, -0.4061392545700073, -0.3805753290653229, -0.3550114035606384, -0.32944750785827637, -0.3038835823535919, -0.27831968665122986, -0.2527557611465454, -0.22719185054302216, -0.2016279399394989, -0.17606401443481445, -0.1505001038312912, -0.12493619322776794, -0.0993722677230835, -0.07380835711956024, -0.04824443906545639, -0.022680524736642838, 0.0028833895921707153, 0.028447307646274567, 0.05401122570037842, 0.07957513630390167, 0.10513906180858612, 0.13070297241210938, 0.15626688301563263, 0.18183080852031708, 0.20739471912384033, 0.23295864462852478, 0.25852257013320923, 0.2840864658355713, 0.30965039134025574, 0.3352143168449402, 0.36077824234962463, 0.3863421380519867, 0.41190606355667114, 0.4374699890613556, 0.46303391456604004, 0.4885978102684021, 0.5141617059707642, 0.539725661277771, 0.5652895569801331, 0.5908535122871399, 0.616417407989502, 0.641981303691864, 0.6675452589988708, 0.6931091547012329, 0.7186731100082397, 0.744236946105957, 0.7698008418083191, 0.7953647971153259, 0.820928692817688, 0.84649258852005, 0.8720565438270569, 0.897620439529419, 0.9231843948364258, 0.9487482905387878]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 7.0, 15.0, 21.0, 31.0, 45.0, 80.0, 124.0, 252.0, 491.0, 1111.0, 2965.0, 9557.0, 41179.0, 254261.0, 588352.0, 118298.0, 22225.0, 5918.0, 1974.0, 791.0, 375.0, 182.0, 115.0, 64.0, 41.0, 20.0, 15.0, 9.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181884765625, -0.17440032958984375, -0.1669158935546875, -0.15943145751953125, -0.151947021484375, -0.14446258544921875, -0.1369781494140625, -0.12949371337890625, -0.12200927734375, -0.11452484130859375, -0.1070404052734375, -0.09955596923828125, -0.092071533203125, -0.08458709716796875, -0.0771026611328125, -0.06961822509765625, -0.0621337890625, -0.05464935302734375, -0.0471649169921875, -0.03968048095703125, -0.032196044921875, -0.02471160888671875, -0.0172271728515625, -0.00974273681640625, -0.00225830078125, 0.00522613525390625, 0.0127105712890625, 0.02019500732421875, 0.027679443359375, 0.03516387939453125, 0.0426483154296875, 0.05013275146484375, 0.0576171875, 0.06510162353515625, 0.0725860595703125, 0.08007049560546875, 0.087554931640625, 0.09503936767578125, 0.1025238037109375, 0.11000823974609375, 0.11749267578125, 0.12497711181640625, 0.1324615478515625, 0.13994598388671875, 0.147430419921875, 0.15491485595703125, 0.1623992919921875, 0.16988372802734375, 0.1773681640625, 0.18485260009765625, 0.1923370361328125, 0.19982147216796875, 0.207305908203125, 0.21479034423828125, 0.2222747802734375, 0.22975921630859375, 0.23724365234375, 0.24472808837890625, 0.2522125244140625, 0.25969696044921875, 0.267181396484375, 0.27466583251953125, 0.2821502685546875, 0.28963470458984375, 0.297119140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 4.0, 14.0, 12.0, 9.0, 20.0, 21.0, 28.0, 41.0, 41.0, 57.0, 55.0, 59.0, 66.0, 69.0, 62.0, 69.0, 63.0, 59.0, 47.0, 52.0, 34.0, 31.0, 18.0, 25.0, 9.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12762069702148438, -0.12267303466796875, -0.11772537231445312, -0.1127777099609375, -0.10783004760742188, -0.10288238525390625, -0.09793472290039062, -0.092987060546875, -0.08803939819335938, -0.08309173583984375, -0.07814407348632812, -0.0731964111328125, -0.06824874877929688, -0.06330108642578125, -0.058353424072265625, -0.05340576171875, -0.048458099365234375, -0.04351043701171875, -0.038562774658203125, -0.0336151123046875, -0.028667449951171875, -0.02371978759765625, -0.018772125244140625, -0.013824462890625, -0.008876800537109375, -0.00392913818359375, 0.001018524169921875, 0.0059661865234375, 0.010913848876953125, 0.01586151123046875, 0.020809173583984375, 0.0257568359375, 0.030704498291015625, 0.03565216064453125, 0.040599822998046875, 0.0455474853515625, 0.050495147705078125, 0.05544281005859375, 0.060390472412109375, 0.065338134765625, 0.07028579711914062, 0.07523345947265625, 0.08018112182617188, 0.0851287841796875, 0.09007644653320312, 0.09502410888671875, 0.09997177124023438, 0.10491943359375, 0.10986709594726562, 0.11481475830078125, 0.11976242065429688, 0.1247100830078125, 0.12965774536132812, 0.13460540771484375, 0.13955307006835938, 0.144500732421875, 0.14944839477539062, 0.15439605712890625, 0.15934371948242188, 0.1642913818359375, 0.16923904418945312, 0.17418670654296875, 0.17913436889648438, 0.18408203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 4.0, 4.0, 17.0, 14.0, 31.0, 33.0, 50.0, 87.0, 129.0, 203.0, 362.0, 681.0, 1679.0, 5252.0, 27671.0, 307119.0, 654078.0, 40518.0, 6792.0, 1957.0, 854.0, 383.0, 226.0, 132.0, 80.0, 61.0, 30.0, 25.0, 17.0, 20.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28525543212890625, -0.2751007080078125, -0.26494598388671875, -0.254791259765625, -0.24463653564453125, -0.2344818115234375, -0.22432708740234375, -0.21417236328125, -0.20401763916015625, -0.1938629150390625, -0.18370819091796875, -0.173553466796875, -0.16339874267578125, -0.1532440185546875, -0.14308929443359375, -0.1329345703125, -0.12277984619140625, -0.1126251220703125, -0.10247039794921875, -0.092315673828125, -0.08216094970703125, -0.0720062255859375, -0.06185150146484375, -0.05169677734375, -0.04154205322265625, -0.0313873291015625, -0.02123260498046875, -0.011077880859375, -0.00092315673828125, 0.0092315673828125, 0.01938629150390625, 0.029541015625, 0.03969573974609375, 0.0498504638671875, 0.06000518798828125, 0.070159912109375, 0.08031463623046875, 0.0904693603515625, 0.10062408447265625, 0.11077880859375, 0.12093353271484375, 0.1310882568359375, 0.14124298095703125, 0.151397705078125, 0.16155242919921875, 0.1717071533203125, 0.18186187744140625, 0.1920166015625, 0.20217132568359375, 0.2123260498046875, 0.22248077392578125, 0.232635498046875, 0.24279022216796875, 0.2529449462890625, 0.26309967041015625, 0.27325439453125, 0.28340911865234375, 0.2935638427734375, 0.30371856689453125, 0.313873291015625, 0.32402801513671875, 0.3341827392578125, 0.34433746337890625, 0.3544921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 10.0, 20.0, 17.0, 25.0, 25.0, 23.0, 20.0, 39.0, 47.0, 55.0, 50.0, 50.0, 50.0, 49.0, 56.0, 52.0, 33.0, 38.0, 48.0, 45.0, 33.0, 34.0, 31.0, 22.0, 20.0, 16.0, 18.0, 7.0, 6.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.395263671875, -0.38181304931640625, -0.3683624267578125, -0.35491180419921875, -0.341461181640625, -0.32801055908203125, -0.3145599365234375, -0.30110931396484375, -0.28765869140625, -0.27420806884765625, -0.2607574462890625, -0.24730682373046875, -0.233856201171875, -0.22040557861328125, -0.2069549560546875, -0.19350433349609375, -0.1800537109375, -0.16660308837890625, -0.1531524658203125, -0.13970184326171875, -0.126251220703125, -0.11280059814453125, -0.0993499755859375, -0.08589935302734375, -0.07244873046875, -0.05899810791015625, -0.0455474853515625, -0.03209686279296875, -0.018646240234375, -0.00519561767578125, 0.0082550048828125, 0.02170562744140625, 0.03515625, 0.04860687255859375, 0.0620574951171875, 0.07550811767578125, 0.088958740234375, 0.10240936279296875, 0.1158599853515625, 0.12931060791015625, 0.14276123046875, 0.15621185302734375, 0.1696624755859375, 0.18311309814453125, 0.196563720703125, 0.21001434326171875, 0.2234649658203125, 0.23691558837890625, 0.2503662109375, 0.26381683349609375, 0.2772674560546875, 0.29071807861328125, 0.304168701171875, 0.31761932373046875, 0.3310699462890625, 0.34452056884765625, 0.35797119140625, 0.37142181396484375, 0.3848724365234375, 0.39832305908203125, 0.411773681640625, 0.42522430419921875, 0.4386749267578125, 0.45212554931640625, 0.465576171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 8.0, 2.0, 12.0, 11.0, 9.0, 24.0, 35.0, 34.0, 64.0, 119.0, 162.0, 291.0, 515.0, 875.0, 1654.0, 3484.0, 7712.0, 18637.0, 53515.0, 237853.0, 603765.0, 76444.0, 24722.0, 9591.0, 4299.0, 2098.0, 1105.0, 610.0, 331.0, 215.0, 110.0, 72.0, 64.0, 35.0, 22.0, 19.0, 8.0, 9.0, 11.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08758544921875, -0.08502006530761719, -0.08245468139648438, -0.07988929748535156, -0.07732391357421875, -0.07475852966308594, -0.07219314575195312, -0.06962776184082031, -0.0670623779296875, -0.06449699401855469, -0.061931610107421875, -0.05936622619628906, -0.05680084228515625, -0.05423545837402344, -0.051670074462890625, -0.04910469055175781, -0.046539306640625, -0.04397392272949219, -0.041408538818359375, -0.03884315490722656, -0.03627777099609375, -0.03371238708496094, -0.031147003173828125, -0.028581619262695312, -0.0260162353515625, -0.023450851440429688, -0.020885467529296875, -0.018320083618164062, -0.01575469970703125, -0.013189315795898438, -0.010623931884765625, -0.008058547973632812, -0.0054931640625, -0.0029277801513671875, -0.000362396240234375, 0.0022029876708984375, 0.00476837158203125, 0.0073337554931640625, 0.009899139404296875, 0.012464523315429688, 0.0150299072265625, 0.017595291137695312, 0.020160675048828125, 0.022726058959960938, 0.02529144287109375, 0.027856826782226562, 0.030422210693359375, 0.03298759460449219, 0.035552978515625, 0.03811836242675781, 0.040683746337890625, 0.04324913024902344, 0.04581451416015625, 0.04837989807128906, 0.050945281982421875, 0.05351066589355469, 0.0560760498046875, 0.05864143371582031, 0.061206817626953125, 0.06377220153808594, 0.06633758544921875, 0.06890296936035156, 0.07146835327148438, 0.07403373718261719, 0.07659912109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 2.0, 8.0, 10.0, 3.0, 20.0, 17.0, 23.0, 25.0, 40.0, 37.0, 70.0, 106.0, 117.0, 109.0, 85.0, 85.0, 64.0, 44.0, 33.0, 15.0, 20.0, 12.0, 12.0, 11.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8220157623291016e-05, -4.680640995502472e-05, -4.539266228675842e-05, -4.3978914618492126e-05, -4.256516695022583e-05, -4.1151419281959534e-05, -3.973767161369324e-05, -3.832392394542694e-05, -3.6910176277160645e-05, -3.549642860889435e-05, -3.408268094062805e-05, -3.2668933272361755e-05, -3.125518560409546e-05, -2.9841437935829163e-05, -2.8427690267562866e-05, -2.701394259929657e-05, -2.5600194931030273e-05, -2.4186447262763977e-05, -2.277269959449768e-05, -2.1358951926231384e-05, -1.9945204257965088e-05, -1.853145658969879e-05, -1.7117708921432495e-05, -1.57039612531662e-05, -1.4290213584899902e-05, -1.2876465916633606e-05, -1.146271824836731e-05, -1.0048970580101013e-05, -8.635222911834717e-06, -7.22147524356842e-06, -5.807727575302124e-06, -4.393979907035828e-06, -2.9802322387695312e-06, -1.5664845705032349e-06, -1.5273690223693848e-07, 1.261010766029358e-06, 2.6747584342956543e-06, 4.088506102561951e-06, 5.502253770828247e-06, 6.9160014390945435e-06, 8.32974910736084e-06, 9.743496775627136e-06, 1.1157244443893433e-05, 1.2570992112159729e-05, 1.3984739780426025e-05, 1.5398487448692322e-05, 1.6812235116958618e-05, 1.8225982785224915e-05, 1.963973045349121e-05, 2.1053478121757507e-05, 2.2467225790023804e-05, 2.38809734582901e-05, 2.5294721126556396e-05, 2.6708468794822693e-05, 2.812221646308899e-05, 2.9535964131355286e-05, 3.094971179962158e-05, 3.236345946788788e-05, 3.3777207136154175e-05, 3.519095480442047e-05, 3.660470247268677e-05, 3.8018450140953064e-05, 3.943219780921936e-05, 4.084594547748566e-05, 4.225969314575195e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 13.0, 10.0, 10.0, 17.0, 25.0, 46.0, 71.0, 134.0, 250.0, 490.0, 1155.0, 3317.0, 11096.0, 48220.0, 607503.0, 320029.0, 41232.0, 9797.0, 3003.0, 1087.0, 459.0, 241.0, 149.0, 66.0, 48.0, 39.0, 17.0, 9.0, 8.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08441162109375, -0.08056640625, -0.07672119140625, -0.0728759765625, -0.06903076171875, -0.065185546875, -0.06134033203125, -0.0574951171875, -0.05364990234375, -0.0498046875, -0.04595947265625, -0.0421142578125, -0.03826904296875, -0.034423828125, -0.03057861328125, -0.0267333984375, -0.02288818359375, -0.01904296875, -0.01519775390625, -0.0113525390625, -0.00750732421875, -0.003662109375, 0.00018310546875, 0.0040283203125, 0.00787353515625, 0.01171875, 0.01556396484375, 0.0194091796875, 0.02325439453125, 0.027099609375, 0.03094482421875, 0.0347900390625, 0.03863525390625, 0.04248046875, 0.04632568359375, 0.0501708984375, 0.05401611328125, 0.057861328125, 0.06170654296875, 0.0655517578125, 0.06939697265625, 0.0732421875, 0.07708740234375, 0.0809326171875, 0.08477783203125, 0.088623046875, 0.09246826171875, 0.0963134765625, 0.10015869140625, 0.10400390625, 0.10784912109375, 0.1116943359375, 0.11553955078125, 0.119384765625, 0.12322998046875, 0.1270751953125, 0.13092041015625, 0.134765625, 0.13861083984375, 0.1424560546875, 0.14630126953125, 0.150146484375, 0.15399169921875, 0.1578369140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 6.0, 12.0, 8.0, 16.0, 17.0, 22.0, 29.0, 29.0, 36.0, 78.0, 66.0, 107.0, 136.0, 90.0, 85.0, 60.0, 39.0, 26.0, 23.0, 19.0, 12.0, 13.0, 10.0, 11.0, 8.0, 8.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09527587890625, -0.09215068817138672, -0.08902549743652344, -0.08590030670166016, -0.08277511596679688, -0.0796499252319336, -0.07652473449707031, -0.07339954376220703, -0.07027435302734375, -0.06714916229248047, -0.06402397155761719, -0.060898780822753906, -0.057773590087890625, -0.054648399353027344, -0.05152320861816406, -0.04839801788330078, -0.0452728271484375, -0.04214763641357422, -0.03902244567871094, -0.035897254943847656, -0.032772064208984375, -0.029646873474121094, -0.026521682739257812, -0.02339649200439453, -0.02027130126953125, -0.01714611053466797, -0.014020919799804688, -0.010895729064941406, -0.007770538330078125, -0.004645347595214844, -0.0015201568603515625, 0.0016050338745117188, 0.004730224609375, 0.007855415344238281, 0.010980606079101562, 0.014105796813964844, 0.017230987548828125, 0.020356178283691406, 0.023481369018554688, 0.02660655975341797, 0.02973175048828125, 0.03285694122314453, 0.03598213195800781, 0.039107322692871094, 0.042232513427734375, 0.045357704162597656, 0.04848289489746094, 0.05160808563232422, 0.0547332763671875, 0.05785846710205078, 0.06098365783691406, 0.06410884857177734, 0.06723403930664062, 0.0703592300415039, 0.07348442077636719, 0.07660961151123047, 0.07973480224609375, 0.08285999298095703, 0.08598518371582031, 0.0891103744506836, 0.09223556518554688, 0.09536075592041016, 0.09848594665527344, 0.10161113739013672, 0.104736328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 25.0, 33.0, 85.0, 123.0, 246.0, 238.0, 99.0, 49.0, 36.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5853729248046875, -2.5114989280700684, -2.4376251697540283, -2.363751173019409, -2.28987717628479, -2.21600341796875, -2.142129421234131, -2.0682554244995117, -1.9943815469741821, -1.9205076694488525, -1.8466336727142334, -1.7727597951889038, -1.6988859176635742, -1.625011920928955, -1.5511380434036255, -1.477264165878296, -1.4033901691436768, -1.3295162916183472, -1.255642294883728, -1.1817684173583984, -1.1078944206237793, -1.0340205430984497, -0.9601466655731201, -0.8862727284431458, -0.8123987913131714, -0.738524854183197, -0.6646509170532227, -0.5907770395278931, -0.5169031023979187, -0.44302916526794434, -0.36915525794029236, -0.2952813506126404, -0.22140741348266602, -0.14753349125385284, -0.07365956902503967, 0.00021435320377349854, 0.07408827543258667, 0.14796221256256104, 0.221836119890213, 0.295710027217865, 0.36958396434783936, 0.4434579014778137, 0.5173318386077881, 0.5912057161331177, 0.665079653263092, 0.7389535903930664, 0.812827467918396, 0.8867014050483704, 0.9605753421783447, 1.0344492197036743, 1.1083232164382935, 1.182197093963623, 1.2560710906982422, 1.3299449682235718, 1.4038188457489014, 1.4776928424835205, 1.55156672000885, 1.6254405975341797, 1.6993145942687988, 1.7731884717941284, 1.847062349319458, 1.9209363460540771, 1.9948102235794067, 2.0686841011047363, 2.1425580978393555]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 13.0, 7.0, 15.0, 16.0, 24.0, 17.0, 23.0, 33.0, 27.0, 37.0, 26.0, 26.0, 41.0, 64.0, 83.0, 106.0, 85.0, 50.0, 39.0, 32.0, 37.0, 28.0, 26.0, 22.0, 15.0, 17.0, 10.0, 6.0, 9.0, 9.0, 10.0, 13.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6635791063308716, -1.611914038658142, -1.5602489709854126, -1.508583903312683, -1.4569188356399536, -1.4052537679672241, -1.3535887002944946, -1.3019236326217651, -1.2502585649490356, -1.1985934972763062, -1.1469284296035767, -1.0952633619308472, -1.0435982942581177, -0.9919332265853882, -0.9402681589126587, -0.8886030912399292, -0.8369379639625549, -0.7852728962898254, -0.733607828617096, -0.6819427609443665, -0.630277693271637, -0.5786125659942627, -0.5269474983215332, -0.4752824604511261, -0.4236173927783966, -0.3719523251056671, -0.3202872574329376, -0.26862215995788574, -0.21695710718631744, -0.16529202461242676, -0.11362695693969727, -0.06196188926696777, -0.010296821594238281, 0.04136824980378151, 0.0930333212018013, 0.1446983963251114, 0.19636346399784088, 0.24802854657173157, 0.29969361424446106, 0.35135868191719055, 0.40302374958992004, 0.45468881726264954, 0.5063539147377014, 0.5580189824104309, 0.6096840500831604, 0.6613491177558899, 0.7130141854286194, 0.7646792531013489, 0.8163443207740784, 0.8680093884468079, 0.9196744561195374, 0.9713395237922668, 1.0230046510696411, 1.0746697187423706, 1.1263347864151, 1.1779998540878296, 1.229664921760559, 1.2813299894332886, 1.332995057106018, 1.3846601247787476, 1.436325192451477, 1.4879902601242065, 1.539655327796936, 1.5913203954696655, 1.642985463142395]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 11.0, 14.0, 21.0, 49.0, 107.0, 188.0, 383.0, 959.0, 2745.0, 10553.0, 65821.0, 1317007.0, 2630953.0, 143338.0, 15493.0, 4002.0, 1477.0, 595.0, 238.0, 128.0, 70.0, 35.0, 21.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.176513671875, -0.1692047119140625, -0.161895751953125, -0.1545867919921875, -0.14727783203125, -0.1399688720703125, -0.132659912109375, -0.1253509521484375, -0.1180419921875, -0.1107330322265625, -0.103424072265625, -0.0961151123046875, -0.08880615234375, -0.0814971923828125, -0.074188232421875, -0.0668792724609375, -0.0595703125, -0.0522613525390625, -0.044952392578125, -0.0376434326171875, -0.03033447265625, -0.0230255126953125, -0.015716552734375, -0.0084075927734375, -0.0010986328125, 0.0062103271484375, 0.013519287109375, 0.0208282470703125, 0.02813720703125, 0.0354461669921875, 0.042755126953125, 0.0500640869140625, 0.057373046875, 0.0646820068359375, 0.071990966796875, 0.0792999267578125, 0.08660888671875, 0.0939178466796875, 0.101226806640625, 0.1085357666015625, 0.1158447265625, 0.1231536865234375, 0.130462646484375, 0.1377716064453125, 0.14508056640625, 0.1523895263671875, 0.159698486328125, 0.1670074462890625, 0.17431640625, 0.1816253662109375, 0.188934326171875, 0.1962432861328125, 0.20355224609375, 0.2108612060546875, 0.218170166015625, 0.2254791259765625, 0.2327880859375, 0.2400970458984375, 0.247406005859375, 0.2547149658203125, 0.26202392578125, 0.2693328857421875, 0.276641845703125, 0.2839508056640625, 0.291259765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 6.0, 8.0, 5.0, 6.0, 13.0, 14.0, 20.0, 30.0, 46.0, 46.0, 40.0, 67.0, 71.0, 66.0, 72.0, 64.0, 61.0, 67.0, 51.0, 50.0, 46.0, 42.0, 38.0, 22.0, 12.0, 10.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.13480186462402344, -0.12958908081054688, -0.12437629699707031, -0.11916351318359375, -0.11395072937011719, -0.10873794555664062, -0.10352516174316406, -0.0983123779296875, -0.09309959411621094, -0.08788681030273438, -0.08267402648925781, -0.07746124267578125, -0.07224845886230469, -0.06703567504882812, -0.06182289123535156, -0.056610107421875, -0.05139732360839844, -0.046184539794921875, -0.04097175598144531, -0.03575897216796875, -0.030546188354492188, -0.025333404541015625, -0.020120620727539062, -0.0149078369140625, -0.009695053100585938, -0.004482269287109375, 0.0007305145263671875, 0.00594329833984375, 0.011156082153320312, 0.016368865966796875, 0.021581649780273438, 0.02679443359375, 0.03200721740722656, 0.037220001220703125, 0.04243278503417969, 0.04764556884765625, 0.05285835266113281, 0.058071136474609375, 0.06328392028808594, 0.0684967041015625, 0.07370948791503906, 0.07892227172851562, 0.08413505554199219, 0.08934783935546875, 0.09456062316894531, 0.09977340698242188, 0.10498619079589844, 0.110198974609375, 0.11541175842285156, 0.12062454223632812, 0.1258373260498047, 0.13105010986328125, 0.1362628936767578, 0.14147567749023438, 0.14668846130371094, 0.1519012451171875, 0.15711402893066406, 0.16232681274414062, 0.1675395965576172, 0.17275238037109375, 0.1779651641845703, 0.18317794799804688, 0.18839073181152344, 0.193603515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 15.0, 17.0, 32.0, 56.0, 122.0, 238.0, 564.0, 1816.0, 9665.0, 198325.0, 3904288.0, 71395.0, 5576.0, 1256.0, 434.0, 224.0, 96.0, 51.0, 40.0, 19.0, 8.0, 12.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4228515625, -0.4084587097167969, -0.39406585693359375, -0.3796730041503906, -0.3652801513671875, -0.3508872985839844, -0.33649444580078125, -0.3221015930175781, -0.307708740234375, -0.2933158874511719, -0.27892303466796875, -0.2645301818847656, -0.2501373291015625, -0.23574447631835938, -0.22135162353515625, -0.20695877075195312, -0.19256591796875, -0.17817306518554688, -0.16378021240234375, -0.14938735961914062, -0.1349945068359375, -0.12060165405273438, -0.10620880126953125, -0.09181594848632812, -0.077423095703125, -0.06303024291992188, -0.04863739013671875, -0.034244537353515625, -0.0198516845703125, -0.005458831787109375, 0.00893402099609375, 0.023326873779296875, 0.0377197265625, 0.052112579345703125, 0.06650543212890625, 0.08089828491210938, 0.0952911376953125, 0.10968399047851562, 0.12407684326171875, 0.13846969604492188, 0.152862548828125, 0.16725540161132812, 0.18164825439453125, 0.19604110717773438, 0.2104339599609375, 0.22482681274414062, 0.23921966552734375, 0.2536125183105469, 0.26800537109375, 0.2823982238769531, 0.29679107666015625, 0.3111839294433594, 0.3255767822265625, 0.3399696350097656, 0.35436248779296875, 0.3687553405761719, 0.383148193359375, 0.3975410461425781, 0.41193389892578125, 0.4263267517089844, 0.4407196044921875, 0.4551124572753906, 0.46950531005859375, 0.4838981628417969, 0.498291015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 9.0, 21.0, 18.0, 21.0, 37.0, 50.0, 94.0, 99.0, 182.0, 312.0, 423.0, 602.0, 658.0, 509.0, 361.0, 215.0, 145.0, 95.0, 56.0, 42.0, 29.0, 20.0, 15.0, 13.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18215370178222656, -0.17522048950195312, -0.1682872772216797, -0.16135406494140625, -0.1544208526611328, -0.14748764038085938, -0.14055442810058594, -0.1336212158203125, -0.12668800354003906, -0.11975479125976562, -0.11282157897949219, -0.10588836669921875, -0.09895515441894531, -0.09202194213867188, -0.08508872985839844, -0.078155517578125, -0.07122230529785156, -0.06428909301757812, -0.05735588073730469, -0.05042266845703125, -0.04348945617675781, -0.036556243896484375, -0.029623031616210938, -0.0226898193359375, -0.015756607055664062, -0.008823394775390625, -0.0018901824951171875, 0.00504302978515625, 0.011976242065429688, 0.018909454345703125, 0.025842666625976562, 0.03277587890625, 0.03970909118652344, 0.046642303466796875, 0.05357551574707031, 0.06050872802734375, 0.06744194030761719, 0.07437515258789062, 0.08130836486816406, 0.0882415771484375, 0.09517478942871094, 0.10210800170898438, 0.10904121398925781, 0.11597442626953125, 0.12290763854980469, 0.12984085083007812, 0.13677406311035156, 0.143707275390625, 0.15064048767089844, 0.15757369995117188, 0.1645069122314453, 0.17144012451171875, 0.1783733367919922, 0.18530654907226562, 0.19223976135253906, 0.1991729736328125, 0.20610618591308594, 0.21303939819335938, 0.2199726104736328, 0.22690582275390625, 0.2338390350341797, 0.24077224731445312, 0.24770545959472656, 0.254638671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 28.0, 48.0, 122.0, 211.0, 243.0, 178.0, 84.0, 43.0, 16.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.689993381500244, -4.591251850128174, -4.492509841918945, -4.393768310546875, -4.2950263023376465, -4.196284770965576, -4.097542762756348, -3.9988012313842773, -3.900059700012207, -3.8013179302215576, -3.702576160430908, -3.603834629058838, -3.5050928592681885, -3.406351089477539, -3.3076093196868896, -3.2088675498962402, -3.110125780105591, -3.0113840103149414, -2.912642240524292, -2.8139004707336426, -2.7151589393615723, -2.616417169570923, -2.5176753997802734, -2.418933629989624, -2.3201918601989746, -2.221450090408325, -2.122708320617676, -2.0239667892456055, -1.925225019454956, -1.8264832496643066, -1.7277414798736572, -1.6289997100830078, -1.5302579402923584, -1.431516170501709, -1.3327745199203491, -1.2340327501296997, -1.1352910995483398, -1.0365493297576904, -0.937807559967041, -0.8390658497810364, -0.7403241395950317, -0.6415824294090271, -0.5428407192230225, -0.44409894943237305, -0.3453572392463684, -0.24661552906036377, -0.14787375926971436, -0.04913204908370972, 0.04960966110229492, 0.14835138618946075, 0.2470931112766266, 0.3458348512649536, 0.44457656145095825, 0.5433182716369629, 0.6420600414276123, 0.7408017516136169, 0.8395434617996216, 0.9382851719856262, 1.0370268821716309, 1.1357686519622803, 1.2345104217529297, 1.3332520723342896, 1.431993842124939, 1.5307354927062988, 1.6294772624969482]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 13.0, 17.0, 10.0, 20.0, 18.0, 20.0, 22.0, 18.0, 36.0, 36.0, 46.0, 50.0, 47.0, 47.0, 55.0, 52.0, 51.0, 65.0, 48.0, 50.0, 34.0, 26.0, 39.0, 33.0, 23.0, 25.0, 19.0, 15.0, 14.0, 8.0, 9.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728849172592163, -1.0371637344360352, -1.001442551612854, -0.9657214283943176, -0.9300003051757812, -0.8942791223526001, -0.858557939529419, -0.8228368163108826, -0.7871156930923462, -0.751394510269165, -0.7156733870506287, -0.6799522042274475, -0.6442310810089111, -0.60850989818573, -0.5727887153625488, -0.5370675921440125, -0.5013464093208313, -0.46562525629997253, -0.42990410327911377, -0.3941829204559326, -0.35846179723739624, -0.3227406144142151, -0.2870194613933563, -0.25129830837249756, -0.2155771553516388, -0.17985600233078003, -0.14413484930992126, -0.1084136813879013, -0.07269252836704254, -0.03697137534618378, -0.0012502074241638184, 0.034470945596694946, 0.07019209861755371, 0.10591325163841248, 0.14163440465927124, 0.1773555725812912, 0.21307672560214996, 0.24879787862300873, 0.2845190465450287, 0.32024019956588745, 0.3559613525867462, 0.391682505607605, 0.42740365862846375, 0.4631248116493225, 0.49884599447250366, 0.53456711769104, 0.5702883005142212, 0.6060094833374023, 0.6417306065559387, 0.6774517893791199, 0.7131729125976562, 0.7488940954208374, 0.7846152186393738, 0.8203364014625549, 0.8560575246810913, 0.8917787075042725, 0.9274998903274536, 0.9632210731506348, 0.9989421963691711, 1.0346633195877075, 1.0703845024108887, 1.1061056852340698, 1.141826868057251, 1.1775479316711426, 1.2132691144943237]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 11.0, 23.0, 24.0, 31.0, 41.0, 108.0, 138.0, 285.0, 597.0, 1109.0, 2907.0, 7747.0, 24772.0, 93797.0, 406248.0, 386518.0, 88075.0, 23259.0, 7563.0, 2822.0, 1235.0, 559.0, 285.0, 125.0, 88.0, 56.0, 28.0, 31.0, 16.0, 11.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.212890625, -0.2068042755126953, -0.20071792602539062, -0.19463157653808594, -0.18854522705078125, -0.18245887756347656, -0.17637252807617188, -0.1702861785888672, -0.1641998291015625, -0.1581134796142578, -0.15202713012695312, -0.14594078063964844, -0.13985443115234375, -0.13376808166503906, -0.12768173217773438, -0.12159538269042969, -0.115509033203125, -0.10942268371582031, -0.10333633422851562, -0.09724998474121094, -0.09116363525390625, -0.08507728576660156, -0.07899093627929688, -0.07290458679199219, -0.0668182373046875, -0.06073188781738281, -0.054645538330078125, -0.04855918884277344, -0.04247283935546875, -0.03638648986816406, -0.030300140380859375, -0.024213790893554688, -0.01812744140625, -0.012041091918945312, -0.005954742431640625, 0.0001316070556640625, 0.00621795654296875, 0.012304306030273438, 0.018390655517578125, 0.024477005004882812, 0.0305633544921875, 0.03664970397949219, 0.042736053466796875, 0.04882240295410156, 0.05490875244140625, 0.06099510192871094, 0.06708145141601562, 0.07316780090332031, 0.079254150390625, 0.08534049987792969, 0.09142684936523438, 0.09751319885253906, 0.10359954833984375, 0.10968589782714844, 0.11577224731445312, 0.12185859680175781, 0.1279449462890625, 0.1340312957763672, 0.14011764526367188, 0.14620399475097656, 0.15229034423828125, 0.15837669372558594, 0.16446304321289062, 0.1705493927001953, 0.1766357421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 9.0, 19.0, 18.0, 27.0, 39.0, 46.0, 50.0, 55.0, 62.0, 64.0, 57.0, 72.0, 69.0, 56.0, 46.0, 60.0, 46.0, 33.0, 28.0, 27.0, 24.0, 23.0, 15.0, 11.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.1368236541748047, -0.13167953491210938, -0.12653541564941406, -0.12139129638671875, -0.11624717712402344, -0.11110305786132812, -0.10595893859863281, -0.1008148193359375, -0.09567070007324219, -0.09052658081054688, -0.08538246154785156, -0.08023834228515625, -0.07509422302246094, -0.06995010375976562, -0.06480598449707031, -0.059661865234375, -0.05451774597167969, -0.049373626708984375, -0.04422950744628906, -0.03908538818359375, -0.03394126892089844, -0.028797149658203125, -0.023653030395507812, -0.0185089111328125, -0.013364791870117188, -0.008220672607421875, -0.0030765533447265625, 0.00206756591796875, 0.0072116851806640625, 0.012355804443359375, 0.017499923706054688, 0.02264404296875, 0.027788162231445312, 0.032932281494140625, 0.03807640075683594, 0.04322052001953125, 0.04836463928222656, 0.053508758544921875, 0.05865287780761719, 0.0637969970703125, 0.06894111633300781, 0.07408523559570312, 0.07922935485839844, 0.08437347412109375, 0.08951759338378906, 0.09466171264648438, 0.09980583190917969, 0.104949951171875, 0.11009407043457031, 0.11523818969726562, 0.12038230895996094, 0.12552642822265625, 0.13067054748535156, 0.13581466674804688, 0.1409587860107422, 0.1461029052734375, 0.1512470245361328, 0.15639114379882812, 0.16153526306152344, 0.16667938232421875, 0.17182350158691406, 0.17696762084960938, 0.1821117401123047, 0.187255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 4.0, 12.0, 17.0, 19.0, 21.0, 36.0, 52.0, 69.0, 92.0, 190.0, 318.0, 518.0, 1200.0, 3530.0, 20933.0, 435219.0, 558414.0, 21711.0, 3589.0, 1207.0, 583.0, 325.0, 165.0, 95.0, 77.0, 63.0, 30.0, 17.0, 9.0, 3.0, 8.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4365234375, -0.4236869812011719, -0.41085052490234375, -0.3980140686035156, -0.3851776123046875, -0.3723411560058594, -0.35950469970703125, -0.3466682434082031, -0.333831787109375, -0.3209953308105469, -0.30815887451171875, -0.2953224182128906, -0.2824859619140625, -0.2696495056152344, -0.25681304931640625, -0.24397659301757812, -0.23114013671875, -0.21830368041992188, -0.20546722412109375, -0.19263076782226562, -0.1797943115234375, -0.16695785522460938, -0.15412139892578125, -0.14128494262695312, -0.128448486328125, -0.11561203002929688, -0.10277557373046875, -0.08993911743164062, -0.0771026611328125, -0.06426620483398438, -0.05142974853515625, -0.038593292236328125, -0.0257568359375, -0.012920379638671875, -8.392333984375e-05, 0.012752532958984375, 0.0255889892578125, 0.038425445556640625, 0.05126190185546875, 0.06409835815429688, 0.076934814453125, 0.08977127075195312, 0.10260772705078125, 0.11544418334960938, 0.1282806396484375, 0.14111709594726562, 0.15395355224609375, 0.16679000854492188, 0.17962646484375, 0.19246292114257812, 0.20529937744140625, 0.21813583374023438, 0.2309722900390625, 0.24380874633789062, 0.25664520263671875, 0.2694816589355469, 0.282318115234375, 0.2951545715332031, 0.30799102783203125, 0.3208274841308594, 0.3336639404296875, 0.3465003967285156, 0.35933685302734375, 0.3721733093261719, 0.385009765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 6.0, 5.0, 13.0, 9.0, 13.0, 34.0, 29.0, 37.0, 38.0, 37.0, 64.0, 63.0, 59.0, 74.0, 78.0, 65.0, 61.0, 50.0, 45.0, 41.0, 41.0, 28.0, 23.0, 26.0, 10.0, 12.0, 7.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.6506729125976562, -0.6309356689453125, -0.6111984252929688, -0.591461181640625, -0.5717239379882812, -0.5519866943359375, -0.5322494506835938, -0.51251220703125, -0.49277496337890625, -0.4730377197265625, -0.45330047607421875, -0.433563232421875, -0.41382598876953125, -0.3940887451171875, -0.37435150146484375, -0.3546142578125, -0.33487701416015625, -0.3151397705078125, -0.29540252685546875, -0.275665283203125, -0.25592803955078125, -0.2361907958984375, -0.21645355224609375, -0.19671630859375, -0.17697906494140625, -0.1572418212890625, -0.13750457763671875, -0.117767333984375, -0.09803009033203125, -0.0782928466796875, -0.05855560302734375, -0.038818359375, -0.01908111572265625, 0.0006561279296875, 0.02039337158203125, 0.040130615234375, 0.05986785888671875, 0.0796051025390625, 0.09934234619140625, 0.11907958984375, 0.13881683349609375, 0.1585540771484375, 0.17829132080078125, 0.198028564453125, 0.21776580810546875, 0.2375030517578125, 0.25724029541015625, 0.2769775390625, 0.29671478271484375, 0.3164520263671875, 0.33618927001953125, 0.355926513671875, 0.37566375732421875, 0.3954010009765625, 0.41513824462890625, 0.43487548828125, 0.45461273193359375, 0.4743499755859375, 0.49408721923828125, 0.513824462890625, 0.5335617065429688, 0.5532989501953125, 0.5730361938476562, 0.5927734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 10.0, 8.0, 17.0, 20.0, 22.0, 38.0, 76.0, 109.0, 181.0, 318.0, 602.0, 1454.0, 3683.0, 11631.0, 50855.0, 757821.0, 183913.0, 26238.0, 7046.0, 2404.0, 948.0, 511.0, 249.0, 130.0, 79.0, 47.0, 37.0, 21.0, 22.0, 18.0, 7.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.10995674133300781, -0.10626602172851562, -0.10257530212402344, -0.09888458251953125, -0.09519386291503906, -0.09150314331054688, -0.08781242370605469, -0.0841217041015625, -0.08043098449707031, -0.07674026489257812, -0.07304954528808594, -0.06935882568359375, -0.06566810607910156, -0.061977386474609375, -0.05828666687011719, -0.054595947265625, -0.05090522766113281, -0.047214508056640625, -0.04352378845214844, -0.03983306884765625, -0.03614234924316406, -0.032451629638671875, -0.028760910034179688, -0.0250701904296875, -0.021379470825195312, -0.017688751220703125, -0.013998031616210938, -0.01030731201171875, -0.0066165924072265625, -0.002925872802734375, 0.0007648468017578125, 0.00445556640625, 0.008146286010742188, 0.011837005615234375, 0.015527725219726562, 0.01921844482421875, 0.022909164428710938, 0.026599884033203125, 0.030290603637695312, 0.0339813232421875, 0.03767204284667969, 0.041362762451171875, 0.04505348205566406, 0.04874420166015625, 0.05243492126464844, 0.056125640869140625, 0.05981636047363281, 0.063507080078125, 0.06719779968261719, 0.07088851928710938, 0.07457923889160156, 0.07826995849609375, 0.08196067810058594, 0.08565139770507812, 0.08934211730957031, 0.0930328369140625, 0.09672355651855469, 0.10041427612304688, 0.10410499572753906, 0.10779571533203125, 0.11148643493652344, 0.11517715454101562, 0.11886787414550781, 0.12255859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 4.0, 5.0, 6.0, 10.0, 20.0, 11.0, 17.0, 17.0, 37.0, 43.0, 64.0, 58.0, 80.0, 68.0, 78.0, 82.0, 75.0, 54.0, 51.0, 48.0, 27.0, 30.0, 20.0, 20.0, 10.0, 5.0, 5.0, 8.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8789043426513672e-05, -2.7704983949661255e-05, -2.6620924472808838e-05, -2.553686499595642e-05, -2.4452805519104004e-05, -2.3368746042251587e-05, -2.228468656539917e-05, -2.1200627088546753e-05, -2.0116567611694336e-05, -1.903250813484192e-05, -1.7948448657989502e-05, -1.6864389181137085e-05, -1.5780329704284668e-05, -1.4696270227432251e-05, -1.3612210750579834e-05, -1.2528151273727417e-05, -1.1444091796875e-05, -1.0360032320022583e-05, -9.275972843170166e-06, -8.191913366317749e-06, -7.107853889465332e-06, -6.023794412612915e-06, -4.939734935760498e-06, -3.855675458908081e-06, -2.771615982055664e-06, -1.687556505203247e-06, -6.034970283508301e-07, 4.805624485015869e-07, 1.564621925354004e-06, 2.648681402206421e-06, 3.732740879058838e-06, 4.816800355911255e-06, 5.900859832763672e-06, 6.984919309616089e-06, 8.068978786468506e-06, 9.153038263320923e-06, 1.023709774017334e-05, 1.1321157217025757e-05, 1.2405216693878174e-05, 1.348927617073059e-05, 1.4573335647583008e-05, 1.5657395124435425e-05, 1.6741454601287842e-05, 1.782551407814026e-05, 1.8909573554992676e-05, 1.9993633031845093e-05, 2.107769250869751e-05, 2.2161751985549927e-05, 2.3245811462402344e-05, 2.432987093925476e-05, 2.5413930416107178e-05, 2.6497989892959595e-05, 2.7582049369812012e-05, 2.866610884666443e-05, 2.9750168323516846e-05, 3.083422780036926e-05, 3.191828727722168e-05, 3.30023467540741e-05, 3.4086406230926514e-05, 3.517046570777893e-05, 3.625452518463135e-05, 3.7338584661483765e-05, 3.842264413833618e-05, 3.95067036151886e-05, 4.0590763092041016e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 5.0, 11.0, 14.0, 13.0, 15.0, 27.0, 54.0, 64.0, 129.0, 256.0, 489.0, 1246.0, 3837.0, 16357.0, 123464.0, 826996.0, 60678.0, 10548.0, 2571.0, 891.0, 396.0, 201.0, 112.0, 64.0, 35.0, 24.0, 19.0, 13.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138427734375, -0.13401222229003906, -0.12959671020507812, -0.1251811981201172, -0.12076568603515625, -0.11635017395019531, -0.11193466186523438, -0.10751914978027344, -0.1031036376953125, -0.09868812561035156, -0.09427261352539062, -0.08985710144042969, -0.08544158935546875, -0.08102607727050781, -0.07661056518554688, -0.07219505310058594, -0.067779541015625, -0.06336402893066406, -0.058948516845703125, -0.05453300476074219, -0.05011749267578125, -0.04570198059082031, -0.041286468505859375, -0.03687095642089844, -0.0324554443359375, -0.028039932250976562, -0.023624420166015625, -0.019208908081054688, -0.01479339599609375, -0.010377883911132812, -0.005962371826171875, -0.0015468597412109375, 0.00286865234375, 0.0072841644287109375, 0.011699676513671875, 0.016115188598632812, 0.02053070068359375, 0.024946212768554688, 0.029361724853515625, 0.03377723693847656, 0.0381927490234375, 0.04260826110839844, 0.047023773193359375, 0.05143928527832031, 0.05585479736328125, 0.06027030944824219, 0.06468582153320312, 0.06910133361816406, 0.073516845703125, 0.07793235778808594, 0.08234786987304688, 0.08676338195800781, 0.09117889404296875, 0.09559440612792969, 0.10000991821289062, 0.10442543029785156, 0.1088409423828125, 0.11325645446777344, 0.11767196655273438, 0.12208747863769531, 0.12650299072265625, 0.1309185028076172, 0.13533401489257812, 0.13974952697753906, 0.1441650390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 6.0, 4.0, 16.0, 16.0, 20.0, 33.0, 30.0, 57.0, 89.0, 95.0, 161.0, 134.0, 99.0, 64.0, 42.0, 23.0, 20.0, 25.0, 8.0, 10.0, 8.0, 8.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.123046875, -0.1194000244140625, -0.115753173828125, -0.1121063232421875, -0.10845947265625, -0.1048126220703125, -0.101165771484375, -0.0975189208984375, -0.0938720703125, -0.0902252197265625, -0.086578369140625, -0.0829315185546875, -0.07928466796875, -0.0756378173828125, -0.071990966796875, -0.0683441162109375, -0.064697265625, -0.0610504150390625, -0.057403564453125, -0.0537567138671875, -0.05010986328125, -0.0464630126953125, -0.042816162109375, -0.0391693115234375, -0.0355224609375, -0.0318756103515625, -0.028228759765625, -0.0245819091796875, -0.02093505859375, -0.0172882080078125, -0.013641357421875, -0.0099945068359375, -0.00634765625, -0.0027008056640625, 0.000946044921875, 0.0045928955078125, 0.00823974609375, 0.0118865966796875, 0.015533447265625, 0.0191802978515625, 0.0228271484375, 0.0264739990234375, 0.030120849609375, 0.0337677001953125, 0.03741455078125, 0.0410614013671875, 0.044708251953125, 0.0483551025390625, 0.052001953125, 0.0556488037109375, 0.059295654296875, 0.0629425048828125, 0.06658935546875, 0.0702362060546875, 0.073883056640625, 0.0775299072265625, 0.0811767578125, 0.0848236083984375, 0.088470458984375, 0.0921173095703125, 0.09576416015625, 0.0994110107421875, 0.103057861328125, 0.1067047119140625, 0.1103515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 39.0, 138.0, 534.0, 191.0, 54.0, 15.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.045783996582031, -5.881122589111328, -5.716460704803467, -5.551799297332764, -5.3871378898620605, -5.222476005554199, -5.057814598083496, -4.893153190612793, -4.72849178314209, -4.563830375671387, -4.399168491363525, -4.234507083892822, -4.069845676422119, -3.905184030532837, -3.7405223846435547, -3.5758609771728516, -3.4111990928649902, -3.246537446975708, -3.081876039505005, -2.9172143936157227, -2.7525529861450195, -2.5878913402557373, -2.423229694366455, -2.258568286895752, -2.0939066410064697, -1.929245114326477, -1.7645835876464844, -1.5999219417572021, -1.4352604150772095, -1.2705988883972168, -1.1059372425079346, -0.9412757158279419, -0.776613712310791, -0.6119521856307983, -0.4472905993461609, -0.2826290428638458, -0.11796748638153076, 0.046694040298461914, 0.21135562658309937, 0.3760172128677368, 0.5406787395477295, 0.7053402662277222, 0.8700018525123596, 1.034663438796997, 1.1993249654769897, 1.3639864921569824, 1.5286481380462646, 1.6933096647262573, 1.85797119140625, 2.0226328372955322, 2.1872942447662354, 2.3519558906555176, 2.5166172981262207, 2.681278944015503, 2.845940589904785, 3.0106019973754883, 3.1752636432647705, 3.3399252891540527, 3.504586696624756, 3.669248342514038, 3.8339099884033203, 3.9985713958740234, 4.163232803344727, 4.327894687652588, 4.492556095123291]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 6.0, 9.0, 5.0, 11.0, 10.0, 23.0, 15.0, 19.0, 19.0, 15.0, 26.0, 22.0, 24.0, 37.0, 47.0, 80.0, 156.0, 122.0, 63.0, 32.0, 29.0, 25.0, 37.0, 20.0, 13.0, 19.0, 16.0, 21.0, 15.0, 19.0, 10.0, 3.0, 4.0, 7.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.999355435371399, -1.9382165670394897, -1.8770778179168701, -1.815938949584961, -1.7548000812530518, -1.6936612129211426, -1.632522463798523, -1.5713835954666138, -1.5102448463439941, -1.449105978012085, -1.3879672288894653, -1.3268283605575562, -1.265689492225647, -1.2045507431030273, -1.1434118747711182, -1.082273006439209, -1.0211341381072998, -0.9599953293800354, -0.8988564610481262, -0.8377176523208618, -0.7765787839889526, -0.7154399752616882, -0.6543011665344238, -0.5931622982025146, -0.5320234894752502, -0.47088465094566345, -0.40974581241607666, -0.34860700368881226, -0.28746816515922546, -0.22632932662963867, -0.16519051790237427, -0.10405167937278748, -0.042912960052490234, 0.01822587102651596, 0.07936470210552216, 0.14050352573394775, 0.20164236426353455, 0.26278120279312134, 0.32392001152038574, 0.38505885004997253, 0.4461976885795593, 0.5073364973068237, 0.5684753656387329, 0.6296141743659973, 0.6907529830932617, 0.7518918514251709, 0.8130306601524353, 0.8741694688796997, 0.9353083372116089, 0.9964471459388733, 1.0575859546661377, 1.1187248229980469, 1.179863691329956, 1.2410025596618652, 1.3021413087844849, 1.363280177116394, 1.4244189262390137, 1.4855577945709229, 1.5466965436935425, 1.6078354120254517, 1.6689742803573608, 1.7301130294799805, 1.7912518978118896, 1.8523907661437988, 1.913529634475708]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 8.0, 6.0, 15.0, 20.0, 27.0, 57.0, 119.0, 242.0, 489.0, 1202.0, 3312.0, 11317.0, 68823.0, 953711.0, 2773752.0, 341210.0, 30017.0, 6442.0, 2046.0, 795.0, 342.0, 133.0, 81.0, 38.0, 23.0, 17.0, 9.0, 6.0, 3.0, 1.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.306396484375, -0.29628753662109375, -0.2861785888671875, -0.27606964111328125, -0.265960693359375, -0.25585174560546875, -0.2457427978515625, -0.23563385009765625, -0.22552490234375, -0.21541595458984375, -0.2053070068359375, -0.19519805908203125, -0.185089111328125, -0.17498016357421875, -0.1648712158203125, -0.15476226806640625, -0.1446533203125, -0.13454437255859375, -0.1244354248046875, -0.11432647705078125, -0.104217529296875, -0.09410858154296875, -0.0839996337890625, -0.07389068603515625, -0.06378173828125, -0.05367279052734375, -0.0435638427734375, -0.03345489501953125, -0.023345947265625, -0.01323699951171875, -0.0031280517578125, 0.00698089599609375, 0.01708984375, 0.02719879150390625, 0.0373077392578125, 0.04741668701171875, 0.057525634765625, 0.06763458251953125, 0.0777435302734375, 0.08785247802734375, 0.09796142578125, 0.10807037353515625, 0.1181793212890625, 0.12828826904296875, 0.138397216796875, 0.14850616455078125, 0.1586151123046875, 0.16872406005859375, 0.1788330078125, 0.18894195556640625, 0.1990509033203125, 0.20915985107421875, 0.219268798828125, 0.22937774658203125, 0.2394866943359375, 0.24959564208984375, 0.25970458984375, 0.26981353759765625, 0.2799224853515625, 0.29003143310546875, 0.300140380859375, 0.31024932861328125, 0.3203582763671875, 0.33046722412109375, 0.340576171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 11.0, 10.0, 17.0, 37.0, 38.0, 46.0, 47.0, 46.0, 50.0, 55.0, 61.0, 74.0, 65.0, 54.0, 52.0, 49.0, 51.0, 49.0, 22.0, 37.0, 23.0, 19.0, 16.0, 11.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.12982749938964844, -0.12501144409179688, -0.12019538879394531, -0.11537933349609375, -0.11056327819824219, -0.10574722290039062, -0.10093116760253906, -0.0961151123046875, -0.09129905700683594, -0.08648300170898438, -0.08166694641113281, -0.07685089111328125, -0.07203483581542969, -0.06721878051757812, -0.06240272521972656, -0.057586669921875, -0.05277061462402344, -0.047954559326171875, -0.04313850402832031, -0.03832244873046875, -0.03350639343261719, -0.028690338134765625, -0.023874282836914062, -0.0190582275390625, -0.014242172241210938, -0.009426116943359375, -0.0046100616455078125, 0.00020599365234375, 0.0050220489501953125, 0.009838104248046875, 0.014654159545898438, 0.01947021484375, 0.024286270141601562, 0.029102325439453125, 0.03391838073730469, 0.03873443603515625, 0.04355049133300781, 0.048366546630859375, 0.05318260192871094, 0.0579986572265625, 0.06281471252441406, 0.06763076782226562, 0.07244682312011719, 0.07726287841796875, 0.08207893371582031, 0.08689498901367188, 0.09171104431152344, 0.096527099609375, 0.10134315490722656, 0.10615921020507812, 0.11097526550292969, 0.11579132080078125, 0.12060737609863281, 0.12542343139648438, 0.13023948669433594, 0.1350555419921875, 0.13987159729003906, 0.14468765258789062, 0.1495037078857422, 0.15431976318359375, 0.1591358184814453, 0.16395187377929688, 0.16876792907714844, 0.173583984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 25.0, 39.0, 103.0, 307.0, 866.0, 3695.0, 1578189.0, 2605820.0, 3889.0, 865.0, 262.0, 92.0, 46.0, 21.0, 10.0, 7.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8935546875, -1.8361968994140625, -1.778839111328125, -1.7214813232421875, -1.66412353515625, -1.6067657470703125, -1.549407958984375, -1.4920501708984375, -1.4346923828125, -1.3773345947265625, -1.319976806640625, -1.2626190185546875, -1.20526123046875, -1.1479034423828125, -1.090545654296875, -1.0331878662109375, -0.975830078125, -0.9184722900390625, -0.861114501953125, -0.8037567138671875, -0.74639892578125, -0.6890411376953125, -0.631683349609375, -0.5743255615234375, -0.5169677734375, -0.4596099853515625, -0.402252197265625, -0.3448944091796875, -0.28753662109375, -0.2301788330078125, -0.172821044921875, -0.1154632568359375, -0.05810546875, -0.0007476806640625, 0.056610107421875, 0.1139678955078125, 0.17132568359375, 0.2286834716796875, 0.286041259765625, 0.3433990478515625, 0.4007568359375, 0.4581146240234375, 0.515472412109375, 0.5728302001953125, 0.63018798828125, 0.6875457763671875, 0.744903564453125, 0.8022613525390625, 0.859619140625, 0.9169769287109375, 0.974334716796875, 1.0316925048828125, 1.08905029296875, 1.1464080810546875, 1.203765869140625, 1.2611236572265625, 1.3184814453125, 1.3758392333984375, 1.433197021484375, 1.4905548095703125, 1.54791259765625, 1.6052703857421875, 1.662628173828125, 1.7199859619140625, 1.77734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 15.0, 43.0, 102.0, 310.0, 838.0, 1516.0, 736.0, 309.0, 118.0, 48.0, 14.0, 14.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.054962158203125, -1.01910400390625, -0.983245849609375, -0.9473876953125, -0.911529541015625, -0.87567138671875, -0.839813232421875, -0.803955078125, -0.768096923828125, -0.73223876953125, -0.696380615234375, -0.6605224609375, -0.624664306640625, -0.58880615234375, -0.552947998046875, -0.51708984375, -0.481231689453125, -0.44537353515625, -0.409515380859375, -0.3736572265625, -0.337799072265625, -0.30194091796875, -0.266082763671875, -0.230224609375, -0.194366455078125, -0.15850830078125, -0.122650146484375, -0.0867919921875, -0.050933837890625, -0.01507568359375, 0.020782470703125, 0.056640625, 0.092498779296875, 0.12835693359375, 0.164215087890625, 0.2000732421875, 0.235931396484375, 0.27178955078125, 0.307647705078125, 0.343505859375, 0.379364013671875, 0.41522216796875, 0.451080322265625, 0.4869384765625, 0.522796630859375, 0.55865478515625, 0.594512939453125, 0.63037109375, 0.666229248046875, 0.70208740234375, 0.737945556640625, 0.7738037109375, 0.809661865234375, 0.84552001953125, 0.881378173828125, 0.917236328125, 0.953094482421875, 0.98895263671875, 1.024810791015625, 1.0606689453125, 1.096527099609375, 1.13238525390625, 1.168243408203125, 1.2041015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 21.0, 60.0, 173.0, 293.0, 242.0, 102.0, 35.0, 18.0, 10.0, 2.0, 9.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.934843063354492, -11.661642074584961, -11.388440132141113, -11.115239143371582, -10.84203815460205, -10.56883716583252, -10.295635223388672, -10.02243423461914, -9.74923324584961, -9.476032257080078, -9.20283031463623, -8.9296293258667, -8.656428337097168, -8.383227348327637, -8.110025405883789, -7.836824417114258, -7.563622951507568, -7.290421485900879, -7.017220497131348, -6.744019031524658, -6.470818042755127, -6.1976165771484375, -5.924415588378906, -5.651214122772217, -5.378012657165527, -5.104811191558838, -4.831610202789307, -4.558408737182617, -4.285207748413086, -4.0120062828063965, -3.738805055618286, -3.465603828430176, -3.1924033164978027, -2.9192020893096924, -2.646000862121582, -2.3727993965148926, -2.0995984077453613, -1.8263970613479614, -1.5531957149505615, -1.2799944877624512, -1.0067932605743408, -0.7335920333862305, -0.46039074659347534, -0.18718945980072021, 0.08601176738739014, 0.3592129945755005, 0.6324143409729004, 0.9056155681610107, 1.178816795349121, 1.4520180225372314, 1.7252192497253418, 1.9984205961227417, 2.2716217041015625, 2.544823169708252, 2.8180243968963623, 3.0912256240844727, 3.364426851272583, 3.6376280784606934, 3.9108293056488037, 4.184030532836914, 4.4572319984436035, 4.730432987213135, 5.003634452819824, 5.2768354415893555, 5.550036907196045]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 10.0, 9.0, 19.0, 32.0, 34.0, 46.0, 50.0, 51.0, 75.0, 77.0, 81.0, 85.0, 76.0, 69.0, 57.0, 51.0, 44.0, 33.0, 25.0, 15.0, 12.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.180706024169922, -4.055411338806152, -3.930116653442383, -3.8048219680786133, -3.6795272827148438, -3.554232597351074, -3.4289379119873047, -3.303643226623535, -3.1783485412597656, -3.053053855895996, -2.9277591705322266, -2.802464485168457, -2.6771697998046875, -2.551875114440918, -2.4265804290771484, -2.301285743713379, -2.1759908199310303, -2.0506961345672607, -1.9254014492034912, -1.8001067638397217, -1.6748120784759521, -1.5495173931121826, -1.4242225885391235, -1.298927903175354, -1.1736332178115845, -1.048338532447815, -0.9230438470840454, -0.7977491021156311, -0.6724544167518616, -0.547159731388092, -0.42186498641967773, -0.2965703010559082, -0.17127585411071777, -0.04598115384578705, 0.07931354641914368, 0.2046082615852356, 0.3299029469490051, 0.45519763231277466, 0.580492377281189, 0.7057870626449585, 0.831081748008728, 0.9563764333724976, 1.081671118736267, 1.2069659233093262, 1.3322606086730957, 1.4575552940368652, 1.5828499794006348, 1.7081446647644043, 1.8334393501281738, 1.9587340354919434, 2.084028720855713, 2.2093234062194824, 2.334618091583252, 2.4599127769470215, 2.585207462310791, 2.7105021476745605, 2.83579683303833, 2.9610915184020996, 3.086386203765869, 3.2116808891296387, 3.336975574493408, 3.4622702598571777, 3.5875649452209473, 3.712859630584717, 3.8381545543670654]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 15.0, 11.0, 25.0, 30.0, 47.0, 64.0, 104.0, 183.0, 367.0, 713.0, 1497.0, 3748.0, 11624.0, 51199.0, 502429.0, 413856.0, 45579.0, 10737.0, 3428.0, 1396.0, 656.0, 319.0, 201.0, 120.0, 67.0, 50.0, 21.0, 18.0, 11.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.33935546875, -0.33017539978027344, -0.3209953308105469, -0.3118152618408203, -0.30263519287109375, -0.2934551239013672, -0.2842750549316406, -0.27509498596191406, -0.2659149169921875, -0.25673484802246094, -0.24755477905273438, -0.2383747100830078, -0.22919464111328125, -0.2200145721435547, -0.21083450317382812, -0.20165443420410156, -0.192474365234375, -0.18329429626464844, -0.17411422729492188, -0.1649341583251953, -0.15575408935546875, -0.1465740203857422, -0.13739395141601562, -0.12821388244628906, -0.1190338134765625, -0.10985374450683594, -0.10067367553710938, -0.09149360656738281, -0.08231353759765625, -0.07313346862792969, -0.06395339965820312, -0.05477333068847656, -0.04559326171875, -0.03641319274902344, -0.027233123779296875, -0.018053054809570312, -0.00887298583984375, 0.0003070831298828125, 0.009487152099609375, 0.018667221069335938, 0.0278472900390625, 0.03702735900878906, 0.046207427978515625, 0.05538749694824219, 0.06456756591796875, 0.07374763488769531, 0.08292770385742188, 0.09210777282714844, 0.101287841796875, 0.11046791076660156, 0.11964797973632812, 0.1288280487060547, 0.13800811767578125, 0.1471881866455078, 0.15636825561523438, 0.16554832458496094, 0.1747283935546875, 0.18390846252441406, 0.19308853149414062, 0.2022686004638672, 0.21144866943359375, 0.2206287384033203, 0.22980880737304688, 0.23898887634277344, 0.2481689453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 14.0, 14.0, 20.0, 28.0, 46.0, 55.0, 67.0, 95.0, 89.0, 110.0, 91.0, 84.0, 65.0, 59.0, 48.0, 34.0, 22.0, 14.0, 11.0, 7.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2862892150878906, -0.27667999267578125, -0.2670707702636719, -0.2574615478515625, -0.24785232543945312, -0.23824310302734375, -0.22863388061523438, -0.219024658203125, -0.20941543579101562, -0.19980621337890625, -0.19019699096679688, -0.1805877685546875, -0.17097854614257812, -0.16136932373046875, -0.15176010131835938, -0.14215087890625, -0.13254165649414062, -0.12293243408203125, -0.11332321166992188, -0.1037139892578125, -0.09410476684570312, -0.08449554443359375, -0.07488632202148438, -0.065277099609375, -0.055667877197265625, -0.04605865478515625, -0.036449432373046875, -0.0268402099609375, -0.017230987548828125, -0.00762176513671875, 0.001987457275390625, 0.0115966796875, 0.021205902099609375, 0.03081512451171875, 0.040424346923828125, 0.0500335693359375, 0.059642791748046875, 0.06925201416015625, 0.07886123657226562, 0.088470458984375, 0.09807968139648438, 0.10768890380859375, 0.11729812622070312, 0.1269073486328125, 0.13651657104492188, 0.14612579345703125, 0.15573501586914062, 0.16534423828125, 0.17495346069335938, 0.18456268310546875, 0.19417190551757812, 0.2037811279296875, 0.21339035034179688, 0.22299957275390625, 0.23260879516601562, 0.242218017578125, 0.2518272399902344, 0.26143646240234375, 0.2710456848144531, 0.2806549072265625, 0.2902641296386719, 0.29987335205078125, 0.3094825744628906, 0.319091796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 5.0, 7.0, 6.0, 8.0, 17.0, 15.0, 23.0, 32.0, 36.0, 32.0, 49.0, 91.0, 126.0, 227.0, 338.0, 602.0, 1354.0, 4501.0, 28721.0, 858675.0, 136931.0, 11943.0, 2585.0, 911.0, 471.0, 262.0, 162.0, 91.0, 80.0, 54.0, 49.0, 27.0, 24.0, 19.0, 10.0, 14.0, 9.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.3359375, -0.32537078857421875, -0.3148040771484375, -0.30423736572265625, -0.293670654296875, -0.28310394287109375, -0.2725372314453125, -0.26197052001953125, -0.25140380859375, -0.24083709716796875, -0.2302703857421875, -0.21970367431640625, -0.209136962890625, -0.19857025146484375, -0.1880035400390625, -0.17743682861328125, -0.1668701171875, -0.15630340576171875, -0.1457366943359375, -0.13516998291015625, -0.124603271484375, -0.11403656005859375, -0.1034698486328125, -0.09290313720703125, -0.08233642578125, -0.07176971435546875, -0.0612030029296875, -0.05063629150390625, -0.040069580078125, -0.02950286865234375, -0.0189361572265625, -0.00836944580078125, 0.002197265625, 0.01276397705078125, 0.0233306884765625, 0.03389739990234375, 0.044464111328125, 0.05503082275390625, 0.0655975341796875, 0.07616424560546875, 0.08673095703125, 0.09729766845703125, 0.1078643798828125, 0.11843109130859375, 0.128997802734375, 0.13956451416015625, 0.1501312255859375, 0.16069793701171875, 0.1712646484375, 0.18183135986328125, 0.1923980712890625, 0.20296478271484375, 0.213531494140625, 0.22409820556640625, 0.2346649169921875, 0.24523162841796875, 0.25579833984375, 0.26636505126953125, 0.2769317626953125, 0.28749847412109375, 0.298065185546875, 0.30863189697265625, 0.3191986083984375, 0.32976531982421875, 0.34033203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 13.0, 9.0, 21.0, 20.0, 13.0, 26.0, 31.0, 39.0, 36.0, 61.0, 54.0, 65.0, 74.0, 80.0, 66.0, 54.0, 48.0, 33.0, 35.0, 23.0, 25.0, 25.0, 15.0, 19.0, 16.0, 8.0, 13.0, 5.0, 6.0, 5.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.6845703125, -0.6636428833007812, -0.6427154541015625, -0.6217880249023438, -0.600860595703125, -0.5799331665039062, -0.5590057373046875, -0.5380783081054688, -0.51715087890625, -0.49622344970703125, -0.4752960205078125, -0.45436859130859375, -0.433441162109375, -0.41251373291015625, -0.3915863037109375, -0.37065887451171875, -0.3497314453125, -0.32880401611328125, -0.3078765869140625, -0.28694915771484375, -0.266021728515625, -0.24509429931640625, -0.2241668701171875, -0.20323944091796875, -0.18231201171875, -0.16138458251953125, -0.1404571533203125, -0.11952972412109375, -0.098602294921875, -0.07767486572265625, -0.0567474365234375, -0.03582000732421875, -0.014892578125, 0.00603485107421875, 0.0269622802734375, 0.04788970947265625, 0.068817138671875, 0.08974456787109375, 0.1106719970703125, 0.13159942626953125, 0.15252685546875, 0.17345428466796875, 0.1943817138671875, 0.21530914306640625, 0.236236572265625, 0.25716400146484375, 0.2780914306640625, 0.29901885986328125, 0.3199462890625, 0.34087371826171875, 0.3618011474609375, 0.38272857666015625, 0.403656005859375, 0.42458343505859375, 0.4455108642578125, 0.46643829345703125, 0.48736572265625, 0.5082931518554688, 0.5292205810546875, 0.5501480102539062, 0.571075439453125, 0.5920028686523438, 0.6129302978515625, 0.6338577270507812, 0.65478515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 4.0, 6.0, 11.0, 6.0, 16.0, 21.0, 21.0, 59.0, 61.0, 123.0, 208.0, 414.0, 1090.0, 3127.0, 14262.0, 169014.0, 830213.0, 22819.0, 4501.0, 1433.0, 550.0, 232.0, 123.0, 78.0, 42.0, 36.0, 22.0, 17.0, 13.0, 7.0, 6.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07220458984375, -0.06995677947998047, -0.06770896911621094, -0.0654611587524414, -0.06321334838867188, -0.060965538024902344, -0.05871772766113281, -0.05646991729736328, -0.05422210693359375, -0.05197429656982422, -0.04972648620605469, -0.047478675842285156, -0.045230865478515625, -0.042983055114746094, -0.04073524475097656, -0.03848743438720703, -0.0362396240234375, -0.03399181365966797, -0.03174400329589844, -0.029496192932128906, -0.027248382568359375, -0.025000572204589844, -0.022752761840820312, -0.02050495147705078, -0.01825714111328125, -0.01600933074951172, -0.013761520385742188, -0.011513710021972656, -0.009265899658203125, -0.007018089294433594, -0.0047702789306640625, -0.0025224685668945312, -0.000274658203125, 0.0019731521606445312, 0.0042209625244140625, 0.006468772888183594, 0.008716583251953125, 0.010964393615722656, 0.013212203979492188, 0.015460014343261719, 0.01770782470703125, 0.01995563507080078, 0.022203445434570312, 0.024451255798339844, 0.026699066162109375, 0.028946876525878906, 0.031194686889648438, 0.03344249725341797, 0.0356903076171875, 0.03793811798095703, 0.04018592834472656, 0.042433738708496094, 0.044681549072265625, 0.046929359436035156, 0.04917716979980469, 0.05142498016357422, 0.05367279052734375, 0.05592060089111328, 0.05816841125488281, 0.060416221618652344, 0.06266403198242188, 0.0649118423461914, 0.06715965270996094, 0.06940746307373047, 0.0716552734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 7.0, 3.0, 5.0, 5.0, 11.0, 15.0, 10.0, 17.0, 31.0, 31.0, 37.0, 71.0, 91.0, 116.0, 140.0, 110.0, 78.0, 59.0, 34.0, 24.0, 29.0, 18.0, 20.0, 13.0, 6.0, 2.0, 14.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.4001808166503906e-05, -5.275662988424301e-05, -5.151145160198212e-05, -5.026627331972122e-05, -4.902109503746033e-05, -4.777591675519943e-05, -4.653073847293854e-05, -4.528556019067764e-05, -4.404038190841675e-05, -4.279520362615585e-05, -4.155002534389496e-05, -4.0304847061634064e-05, -3.905966877937317e-05, -3.7814490497112274e-05, -3.656931221485138e-05, -3.5324133932590485e-05, -3.407895565032959e-05, -3.2833777368068695e-05, -3.15885990858078e-05, -3.0343420803546906e-05, -2.909824252128601e-05, -2.7853064239025116e-05, -2.660788595676422e-05, -2.5362707674503326e-05, -2.411752939224243e-05, -2.2872351109981537e-05, -2.1627172827720642e-05, -2.0381994545459747e-05, -1.9136816263198853e-05, -1.7891637980937958e-05, -1.6646459698677063e-05, -1.5401281416416168e-05, -1.4156103134155273e-05, -1.2910924851894379e-05, -1.1665746569633484e-05, -1.0420568287372589e-05, -9.175390005111694e-06, -7.9302117228508e-06, -6.685033440589905e-06, -5.43985515832901e-06, -4.194676876068115e-06, -2.9494985938072205e-06, -1.7043203115463257e-06, -4.591420292854309e-07, 7.860362529754639e-07, 2.0312145352363586e-06, 3.2763928174972534e-06, 4.521571099758148e-06, 5.766749382019043e-06, 7.011927664279938e-06, 8.257105946540833e-06, 9.502284228801727e-06, 1.0747462511062622e-05, 1.1992640793323517e-05, 1.3237819075584412e-05, 1.4482997357845306e-05, 1.57281756401062e-05, 1.6973353922367096e-05, 1.821853220462799e-05, 1.9463710486888885e-05, 2.070888876914978e-05, 2.1954067051410675e-05, 2.319924533367157e-05, 2.4444423615932465e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 15.0, 16.0, 20.0, 34.0, 49.0, 75.0, 99.0, 165.0, 322.0, 555.0, 1088.0, 2416.0, 5740.0, 16538.0, 64910.0, 814841.0, 105889.0, 22462.0, 7431.0, 2958.0, 1371.0, 657.0, 310.0, 197.0, 126.0, 69.0, 61.0, 26.0, 22.0, 21.0, 16.0, 14.0, 3.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.04925537109375, -0.04783296585083008, -0.046410560607910156, -0.044988155364990234, -0.04356575012207031, -0.04214334487915039, -0.04072093963623047, -0.03929853439331055, -0.037876129150390625, -0.0364537239074707, -0.03503131866455078, -0.03360891342163086, -0.03218650817871094, -0.030764102935791016, -0.029341697692871094, -0.027919292449951172, -0.02649688720703125, -0.025074481964111328, -0.023652076721191406, -0.022229671478271484, -0.020807266235351562, -0.01938486099243164, -0.01796245574951172, -0.016540050506591797, -0.015117645263671875, -0.013695240020751953, -0.012272834777832031, -0.01085042953491211, -0.009428024291992188, -0.008005619049072266, -0.006583213806152344, -0.005160808563232422, -0.0037384033203125, -0.002315998077392578, -0.0008935928344726562, 0.0005288124084472656, 0.0019512176513671875, 0.0033736228942871094, 0.004796028137207031, 0.006218433380126953, 0.007640838623046875, 0.009063243865966797, 0.010485649108886719, 0.01190805435180664, 0.013330459594726562, 0.014752864837646484, 0.016175270080566406, 0.017597675323486328, 0.01902008056640625, 0.020442485809326172, 0.021864891052246094, 0.023287296295166016, 0.024709701538085938, 0.02613210678100586, 0.02755451202392578, 0.028976917266845703, 0.030399322509765625, 0.03182172775268555, 0.03324413299560547, 0.03466653823852539, 0.03608894348144531, 0.037511348724365234, 0.038933753967285156, 0.04035615921020508, 0.041778564453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 2.0, 9.0, 7.0, 8.0, 9.0, 15.0, 8.0, 38.0, 33.0, 64.0, 82.0, 138.0, 148.0, 133.0, 92.0, 48.0, 35.0, 28.0, 26.0, 13.0, 13.0, 10.0, 6.0, 11.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0826416015625, -0.08043527603149414, -0.07822895050048828, -0.07602262496948242, -0.07381629943847656, -0.0716099739074707, -0.06940364837646484, -0.06719732284545898, -0.06499099731445312, -0.06278467178344727, -0.060578346252441406, -0.05837202072143555, -0.05616569519042969, -0.05395936965942383, -0.05175304412841797, -0.04954671859741211, -0.04734039306640625, -0.04513406753540039, -0.04292774200439453, -0.04072141647338867, -0.03851509094238281, -0.03630876541137695, -0.034102439880371094, -0.031896114349365234, -0.029689788818359375, -0.027483463287353516, -0.025277137756347656, -0.023070812225341797, -0.020864486694335938, -0.018658161163330078, -0.01645183563232422, -0.01424551010131836, -0.0120391845703125, -0.00983285903930664, -0.007626533508300781, -0.005420207977294922, -0.0032138824462890625, -0.0010075569152832031, 0.0011987686157226562, 0.0034050941467285156, 0.005611419677734375, 0.007817745208740234, 0.010024070739746094, 0.012230396270751953, 0.014436721801757812, 0.016643047332763672, 0.01884937286376953, 0.02105569839477539, 0.02326202392578125, 0.02546834945678711, 0.02767467498779297, 0.029881000518798828, 0.03208732604980469, 0.03429365158081055, 0.036499977111816406, 0.038706302642822266, 0.040912628173828125, 0.043118953704833984, 0.045325279235839844, 0.0475316047668457, 0.04973793029785156, 0.05194425582885742, 0.05415058135986328, 0.05635690689086914, 0.058563232421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 20.0, 35.0, 123.0, 607.0, 123.0, 51.0, 17.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.086722373962402, -6.946247100830078, -6.805771827697754, -6.66529655456543, -6.5248212814331055, -6.384346008300781, -6.243870735168457, -6.103395462036133, -5.962920188903809, -5.822444915771484, -5.68196964263916, -5.541494369506836, -5.401019096374512, -5.2605438232421875, -5.120068550109863, -4.979593276977539, -4.839118003845215, -4.698642730712891, -4.558167457580566, -4.417692184448242, -4.277216911315918, -4.136741638183594, -3.9962663650512695, -3.8557910919189453, -3.7153162956237793, -3.574841022491455, -3.434365749359131, -3.2938904762268066, -3.1534152030944824, -3.012939929962158, -2.872464656829834, -2.7319893836975098, -2.5915143489837646, -2.4510390758514404, -2.310563802719116, -2.170088529586792, -2.0296132564544678, -1.8891379833221436, -1.7486628293991089, -1.6081875562667847, -1.4677122831344604, -1.3272370100021362, -1.186761736869812, -1.0462865829467773, -0.9058112502098083, -0.7653359770774841, -0.6248607635498047, -0.48438549041748047, -0.34391021728515625, -0.20343495905399323, -0.0629597008228302, 0.07751554250717163, 0.21799081563949585, 0.35846608877182007, 0.4989413022994995, 0.6394165754318237, 0.779891848564148, 0.9203671216964722, 1.0608423948287964, 1.201317548751831, 1.3417928218841553, 1.4822680950164795, 1.6227433681488037, 1.763218641281128, 1.9036939144134521]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 6.0, 11.0, 9.0, 14.0, 19.0, 16.0, 21.0, 31.0, 34.0, 40.0, 77.0, 273.0, 200.0, 50.0, 33.0, 28.0, 25.0, 22.0, 18.0, 17.0, 11.0, 8.0, 10.0, 7.0, 5.0, 0.0, 8.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.076354742050171, -1.9853906631469727, -1.8944265842437744, -1.8034626245498657, -1.7124985456466675, -1.6215344667434692, -1.5305705070495605, -1.4396064281463623, -1.348642349243164, -1.2576782703399658, -1.1667141914367676, -1.0757502317428589, -0.9847861528396606, -0.8938220739364624, -0.8028580546379089, -0.7118940353393555, -0.6209299564361572, -0.529965877532959, -0.4390018582344055, -0.34803780913352966, -0.2570737600326538, -0.16610971093177795, -0.0751456618309021, 0.015818357467651367, 0.10678243637084961, 0.19774648547172546, 0.2887105345726013, 0.3796745836734772, 0.470638632774353, 0.5616027116775513, 0.6525667309761047, 0.7435307502746582, 0.8344945907592773, 0.9254586696624756, 1.0164227485656738, 1.1073867082595825, 1.1983507871627808, 1.289314866065979, 1.3802788257598877, 1.471242904663086, 1.5622069835662842, 1.6531710624694824, 1.7441351413726807, 1.8350991010665894, 1.9260631799697876, 2.0170271396636963, 2.1079912185668945, 2.1989552974700928, 2.289919376373291, 2.3808834552764893, 2.4718475341796875, 2.5628116130828857, 2.653775691986084, 2.744739532470703, 2.8357036113739014, 2.9266676902770996, 3.017631769180298, 3.108595848083496, 3.1995599269866943, 3.2905240058898926, 3.3814878463745117, 3.47245192527771, 3.563416004180908, 3.6543800830841064, 3.7453441619873047]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 8.0, 12.0, 16.0, 17.0, 19.0, 22.0, 30.0, 50.0, 37.0, 43.0, 67.0, 214.0, 119.0, 53.0, 36.0, 40.0, 34.0, 28.0, 20.0, 26.0, 21.0, 17.0, 10.0, 11.0, 4.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17206764221191406, -0.16627883911132812, -0.1604900360107422, -0.15470123291015625, -0.1489124298095703, -0.14312362670898438, -0.13733482360839844, -0.1315460205078125, -0.12575721740722656, -0.11996841430664062, -0.11417961120605469, -0.10839080810546875, -0.10260200500488281, -0.09681320190429688, -0.09102439880371094, -0.085235595703125, -0.07944679260253906, -0.07365798950195312, -0.06786918640136719, -0.06208038330078125, -0.05629158020019531, -0.050502777099609375, -0.04471397399902344, -0.0389251708984375, -0.03313636779785156, -0.027347564697265625, -0.021558761596679688, -0.01576995849609375, -0.009981155395507812, -0.004192352294921875, 0.0015964508056640625, 0.00738525390625, 0.013174057006835938, 0.018962860107421875, 0.024751663208007812, 0.03054046630859375, 0.03632926940917969, 0.042118072509765625, 0.04790687561035156, 0.0536956787109375, 0.05948448181152344, 0.06527328491210938, 0.07106208801269531, 0.07685089111328125, 0.08263969421386719, 0.08842849731445312, 0.09421730041503906, 0.100006103515625, 0.10579490661621094, 0.11158370971679688, 0.11737251281738281, 0.12316131591796875, 0.1289501190185547, 0.13473892211914062, 0.14052772521972656, 0.1463165283203125, 0.15210533142089844, 0.15789413452148438, 0.1636829376220703, 0.16947174072265625, 0.1752605438232422, 0.18104934692382812, 0.18683815002441406, 0.192626953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 12.0, 2.0, 1.0, 7.0, 9.0, 14.0, 17.0, 45.0, 50.0, 77.0, 167.0, 379.0, 1301.0, 10077.0, 8362151.0, 12084.0, 1435.0, 374.0, 154.0, 79.0, 55.0, 23.0, 21.0, 14.0, 9.0, 13.0, 5.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7340997457504272, -1.6687462329864502, -1.6033926010131836, -1.5380390882492065, -1.4726855754852295, -1.4073320627212524, -1.3419785499572754, -1.2766249179840088, -1.2112714052200317, -1.1459178924560547, -1.080564260482788, -1.015210747718811, -0.949857234954834, -0.8845037221908569, -0.8191501498222351, -0.7537965774536133, -0.6884430646896362, -0.6230895519256592, -0.5577359795570374, -0.4923824369907379, -0.4270288944244385, -0.36167535185813904, -0.2963218092918396, -0.23096826672554016, -0.16561472415924072, -0.10026118159294128, -0.034907639026641846, 0.030445903539657593, 0.09579944610595703, 0.16115298867225647, 0.2265065312385559, 0.29186007380485535, 0.35721349716186523, 0.4225670397281647, 0.4879205822944641, 0.5532741546630859, 0.618627667427063, 0.68398118019104, 0.7493347525596619, 0.8146883249282837, 0.8800418376922607, 0.9453953504562378, 1.0107488632202148, 1.0761024951934814, 1.1414560079574585, 1.2068095207214355, 1.2721631526947021, 1.3375166654586792, 1.4028701782226562, 1.4682236909866333, 1.5335772037506104, 1.598930835723877, 1.664284348487854, 1.729637861251831, 1.7949914932250977, 1.8603450059890747, 1.9256985187530518, 1.9910520315170288, 2.056405544281006, 2.1217591762542725, 2.187112808227539, 2.2524662017822266, 2.317819833755493, 2.3831732273101807, 2.4485268592834473]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 4.0, 1.0, 8.0, 1.0, 5.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.914140224456787, -2.838815212249756, -2.7634899616241455, -2.688164710998535, -2.612839698791504, -2.5375146865844727, -2.4621894359588623, -2.386864185333252, -2.3115391731262207, -2.2362141609191895, -2.160888910293579, -2.0855636596679688, -2.0102386474609375, -1.9349135160446167, -1.859588384628296, -1.784263253211975, -1.7089381217956543, -1.6336129903793335, -1.5582878589630127, -1.482962727546692, -1.407637596130371, -1.3323124647140503, -1.2569873332977295, -1.1816622018814087, -1.106337070465088, -1.031011939048767, -0.9556868076324463, -0.8803616762161255, -0.8050365447998047, -0.7297114133834839, -0.6543862819671631, -0.5790611505508423, -0.5037362575531006, -0.4284111261367798, -0.353085994720459, -0.2777608633041382, -0.20243573188781738, -0.12711060047149658, -0.05178546905517578, 0.02353966236114502, 0.09886479377746582, 0.17418992519378662, 0.24951505661010742, 0.3248401880264282, 0.400165319442749, 0.4754904508590698, 0.5508155822753906, 0.6261407136917114, 0.7014658451080322, 0.776790976524353, 0.8521161079406738, 0.9274412393569946, 1.0027663707733154, 1.0780915021896362, 1.153416633605957, 1.2287417650222778, 1.3040668964385986, 1.3793920278549194, 1.4547171592712402, 1.530042290687561, 1.6053674221038818, 1.6806925535202026, 1.7560176849365234, 1.8313428163528442, 1.906667947769165]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 5.0, 7.0, 5.0, 14.0, 25.0, 14.0, 27.0, 40.0, 53.0, 48.0, 70.0, 51.0, 75.0, 78.0, 81.0, 67.0, 58.0, 56.0, 53.0, 33.0, 35.0, 22.0, 16.0, 11.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08343505859375, -0.08044052124023438, -0.07744598388671875, -0.07445144653320312, -0.0714569091796875, -0.06846237182617188, -0.06546783447265625, -0.062473297119140625, -0.059478759765625, -0.056484222412109375, -0.05348968505859375, -0.050495147705078125, -0.0475006103515625, -0.044506072998046875, -0.04151153564453125, -0.038516998291015625, -0.0355224609375, -0.032527923583984375, -0.02953338623046875, -0.026538848876953125, -0.0235443115234375, -0.020549774169921875, -0.01755523681640625, -0.014560699462890625, -0.011566162109375, -0.008571624755859375, -0.00557708740234375, -0.002582550048828125, 0.0004119873046875, 0.003406524658203125, 0.00640106201171875, 0.009395599365234375, 0.01239013671875, 0.015384674072265625, 0.01837921142578125, 0.021373748779296875, 0.0243682861328125, 0.027362823486328125, 0.03035736083984375, 0.033351898193359375, 0.036346435546875, 0.039340972900390625, 0.04233551025390625, 0.045330047607421875, 0.0483245849609375, 0.051319122314453125, 0.05431365966796875, 0.057308197021484375, 0.060302734375, 0.06329727172851562, 0.06629180908203125, 0.06928634643554688, 0.0722808837890625, 0.07527542114257812, 0.07826995849609375, 0.08126449584960938, 0.084259033203125, 0.08725357055664062, 0.09024810791015625, 0.09324264526367188, 0.0962371826171875, 0.09923171997070312, 0.10222625732421875, 0.10522079467773438, 0.10821533203125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 2.0, 10.0, 8.0, 20.0, 20.0, 26.0, 22.0, 60.0, 55.0, 106.0, 176.0, 286.0, 510.0, 1073.0, 2428.0, 6607.0, 19003.0, 61506.0, 180164.0, 168314.0, 55537.0, 17535.0, 6069.0, 2389.0, 1041.0, 524.0, 260.0, 151.0, 91.0, 76.0, 52.0, 33.0, 28.0, 16.0, 13.0, 12.0, 11.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.087890625, -1.0538482666015625, -1.019805908203125, -0.9857635498046875, -0.95172119140625, -0.9176788330078125, -0.883636474609375, -0.8495941162109375, -0.8155517578125, -0.7815093994140625, -0.747467041015625, -0.7134246826171875, -0.67938232421875, -0.6453399658203125, -0.611297607421875, -0.5772552490234375, -0.543212890625, -0.5091705322265625, -0.475128173828125, -0.4410858154296875, -0.40704345703125, -0.3730010986328125, -0.338958740234375, -0.3049163818359375, -0.2708740234375, -0.2368316650390625, -0.202789306640625, -0.1687469482421875, -0.13470458984375, -0.1006622314453125, -0.066619873046875, -0.0325775146484375, 0.00146484375, 0.0355072021484375, 0.069549560546875, 0.1035919189453125, 0.13763427734375, 0.1716766357421875, 0.205718994140625, 0.2397613525390625, 0.2738037109375, 0.3078460693359375, 0.341888427734375, 0.3759307861328125, 0.40997314453125, 0.4440155029296875, 0.478057861328125, 0.5121002197265625, 0.546142578125, 0.5801849365234375, 0.614227294921875, 0.6482696533203125, 0.68231201171875, 0.7163543701171875, 0.750396728515625, 0.7844390869140625, 0.8184814453125, 0.8525238037109375, 0.886566162109375, 0.9206085205078125, 0.95465087890625, 0.9886932373046875, 1.022735595703125, 1.0567779541015625, 1.0908203125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 8.0, 12.0, 12.0, 17.0, 28.0, 39.0, 60.0, 58.0, 67.0, 108.0, 119.0, 107.0, 80.0, 69.0, 55.0, 43.0, 25.0, 26.0, 17.0, 12.0, 7.0, 8.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.22381210327148438, -0.21471405029296875, -0.20561599731445312, -0.1965179443359375, -0.18741989135742188, -0.17832183837890625, -0.16922378540039062, -0.160125732421875, -0.15102767944335938, -0.14192962646484375, -0.13283157348632812, -0.1237335205078125, -0.11463546752929688, -0.10553741455078125, -0.09643936157226562, -0.08734130859375, -0.07824325561523438, -0.06914520263671875, -0.060047149658203125, -0.0509490966796875, -0.041851043701171875, -0.03275299072265625, -0.023654937744140625, -0.014556884765625, -0.005458831787109375, 0.00363922119140625, 0.012737274169921875, 0.0218353271484375, 0.030933380126953125, 0.04003143310546875, 0.049129486083984375, 0.0582275390625, 0.06732559204101562, 0.07642364501953125, 0.08552169799804688, 0.0946197509765625, 0.10371780395507812, 0.11281585693359375, 0.12191390991210938, 0.131011962890625, 0.14011001586914062, 0.14920806884765625, 0.15830612182617188, 0.1674041748046875, 0.17650222778320312, 0.18560028076171875, 0.19469833374023438, 0.20379638671875, 0.21289443969726562, 0.22199249267578125, 0.23109054565429688, 0.2401885986328125, 0.24928665161132812, 0.25838470458984375, 0.2674827575683594, 0.276580810546875, 0.2856788635253906, 0.29477691650390625, 0.3038749694824219, 0.3129730224609375, 0.3220710754394531, 0.33116912841796875, 0.3402671813964844, 0.349365234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 17.0, 32.0, 51.0, 99.0, 104.0, 64.0, 51.0, 18.0, 9.0, 6.0, 7.0, 3.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9511016607284546, -0.8965842127799988, -0.8420668244361877, -0.7875493764877319, -0.7330319881439209, -0.6785145401954651, -0.6239970922470093, -0.5694797039031982, -0.5149622559547424, -0.460444837808609, -0.4059274196624756, -0.3514099717140198, -0.29689255356788635, -0.24237513542175293, -0.18785768747329712, -0.1333402693271637, -0.07882285118103027, -0.024305425584316254, 0.030212000012397766, 0.08472943305969238, 0.1392468512058258, 0.19376426935195923, 0.24828171730041504, 0.30279913544654846, 0.3573165535926819, 0.4118339717388153, 0.46635138988494873, 0.5208688378334045, 0.5753862857818604, 0.6299036741256714, 0.6844211220741272, 0.738938570022583, 0.7934558391571045, 0.8479732871055603, 0.9024906754493713, 0.9570081233978271, 1.0115255117416382, 1.0660429000854492, 1.1205604076385498, 1.1750777959823608, 1.2295951843261719, 1.284112572669983, 1.3386300802230835, 1.3931474685668945, 1.4476648569107056, 1.5021822452545166, 1.5566997528076172, 1.6112171411514282, 1.6657346487045288, 1.7202520370483398, 1.7747695446014404, 1.8292869329452515, 1.8838043212890625, 1.938321828842163, 1.9928392171859741, 2.047356605529785, 2.1018741130828857, 2.1563916206359863, 2.210908889770508, 2.2654263973236084, 2.319943904876709, 2.3744611740112305, 2.428978681564331, 2.4834961891174316, 2.538013458251953]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 5.0, 10.0, 4.0, 13.0, 23.0, 20.0, 49.0, 70.0, 76.0, 66.0, 35.0, 35.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2129456996917725, -1.1660399436950684, -1.1191341876983643, -1.0722284317016602, -1.025322675704956, -0.9784169793128967, -0.9315112829208374, -0.8846055269241333, -0.8376997709274292, -0.7907940149307251, -0.743888258934021, -0.6969825625419617, -0.6500768065452576, -0.6031710505485535, -0.5562653541564941, -0.50935959815979, -0.46245384216308594, -0.41554808616638184, -0.3686423599720001, -0.3217366337776184, -0.2748308777809143, -0.2279251366853714, -0.1810193955898285, -0.13411366939544678, -0.08720791339874268, -0.04030217230319977, 0.00660356879234314, 0.05350930988788605, 0.10041505098342896, 0.14732079207897186, 0.19422653317451477, 0.24113225936889648, 0.28803789615631104, 0.33494365215301514, 0.38184937834739685, 0.42875510454177856, 0.47566086053848267, 0.5225666165351868, 0.5694723129272461, 0.6163780689239502, 0.6632838249206543, 0.7101895809173584, 0.7570953369140625, 0.8040010333061218, 0.8509067893028259, 0.89781254529953, 0.9447182416915894, 0.9916239976882935, 1.0385297536849976, 1.0854355096817017, 1.1323412656784058, 1.1792470216751099, 1.2261526584625244, 1.2730584144592285, 1.3199641704559326, 1.3668699264526367, 1.4137756824493408, 1.460681438446045, 1.507587194442749, 1.5544929504394531, 1.6013987064361572, 1.6483043432235718, 1.6952100992202759, 1.74211585521698, 1.789021611213684]}, "eval/loss": 4.050220966339111, "eval/wer": 1.7867314557715193, "eval/runtime": 594.0081, "eval/samples_per_second": 4.448, "eval/steps_per_second": 0.557} \ No newline at end of file +{"train/loss": 0.1399, "train/learning_rate": 5.804878048780487e-05, "train/epoch": 4.48, "train/global_step": 1000, "_runtime": 23379, "_timestamp": 1648260507, "_step": 1001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 12.0, 33.0, 69.0, 114.0, 204.0, 218.0, 169.0, 114.0, 54.0, 24.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6282283663749695, -0.5442143082618713, -0.4602002799510956, -0.3761862516403198, -0.2921721935272217, -0.20815813541412354, -0.12414413690567017, -0.04013007879257202, 0.04388397932052612, 0.12789802253246307, 0.21191206574440002, 0.2959260940551758, 0.3799401521682739, 0.46395421028137207, 0.5479682087898254, 0.6319822669029236, 0.7159963250160217, 0.8000103831291199, 0.8840243816375732, 0.9680384397506714, 1.0520524978637695, 1.1360665559768677, 1.2200806140899658, 1.3040945529937744, 1.388108730316162, 1.4721227884292603, 1.5561368465423584, 1.640150785446167, 1.7241649627685547, 1.8081789016723633, 1.8921929597854614, 1.9762070178985596, 2.0602211952209473, 2.144235134124756, 2.2282493114471436, 2.312263250350952, 2.39627742767334, 2.4802913665771484, 2.564305305480957, 2.6483194828033447, 2.7323336601257324, 2.816347599029541, 2.9003617763519287, 2.9843757152557373, 3.068389892578125, 3.1524038314819336, 3.236417770385742, 3.32043194770813, 3.4044458866119385, 3.488459825515747, 3.5724740028381348, 3.6564879417419434, 3.740502119064331, 3.8245160579681396, 3.9085302352905273, 3.992544174194336, 4.0765581130981445, 4.160572052001953, 4.244585990905762, 4.3286004066467285, 4.412614345550537, 4.496628284454346, 4.580642223358154, 4.664656639099121, 4.74867057800293]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 11.0, 8.0, 13.0, 15.0, 12.0, 15.0, 19.0, 21.0, 26.0, 26.0, 30.0, 16.0, 37.0, 48.0, 41.0, 30.0, 29.0, 34.0, 33.0, 45.0, 37.0, 35.0, 32.0, 36.0, 31.0, 24.0, 26.0, 30.0, 25.0, 25.0, 26.0, 22.0, 21.0, 19.0, 10.0, 14.0, 11.0, 7.0, 10.0, 5.0, 9.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.6512007117271423, -0.6314267516136169, -0.6116528511047363, -0.5918788909912109, -0.5721049308776855, -0.5523310303688049, -0.5325570702552795, -0.5127831697463989, -0.49300920963287354, -0.47323527932167053, -0.45346134901046753, -0.43368738889694214, -0.41391345858573914, -0.39413952827453613, -0.37436556816101074, -0.35459163784980774, -0.33481770753860474, -0.31504377722740173, -0.29526984691619873, -0.27549588680267334, -0.25572195649147034, -0.23594802618026733, -0.21617408096790314, -0.19640013575553894, -0.17662620544433594, -0.15685227513313293, -0.13707832992076874, -0.11730439215898514, -0.09753045439720154, -0.07775651663541794, -0.05798257887363434, -0.03820863366127014, -0.01843470335006714, 0.0013392344117164612, 0.02111317217350006, 0.04088710993528366, 0.06066104769706726, 0.08043498545885086, 0.10020892322063446, 0.11998286843299866, 0.13975679874420166, 0.15953072905540466, 0.17930467426776886, 0.19907861948013306, 0.21885254979133606, 0.23862648010253906, 0.25840044021606445, 0.27817437052726746, 0.29794830083847046, 0.31772223114967346, 0.33749616146087646, 0.35727012157440186, 0.37704405188560486, 0.39681798219680786, 0.41659194231033325, 0.43636587262153625, 0.45613980293273926, 0.47591373324394226, 0.49568766355514526, 0.5154616236686707, 0.5352355241775513, 0.5550094842910767, 0.574783444404602, 0.5945574045181274, 0.6143313050270081]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 17.0, 20.0, 25.0, 41.0, 57.0, 78.0, 97.0, 144.0, 157.0, 242.0, 361.0, 536.0, 812.0, 1261.0, 2350.0, 5105.0, 14067.0, 54606.0, 330245.0, 1770445.0, 1647513.0, 290964.0, 50858.0, 13409.0, 4942.0, 2230.0, 1237.0, 719.0, 453.0, 345.0, 234.0, 185.0, 131.0, 96.0, 73.0, 62.0, 39.0, 23.0, 24.0, 22.0, 9.0, 12.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.2042236328125, -2.133056640625, -2.0618896484375, -1.99072265625, -1.9195556640625, -1.848388671875, -1.7772216796875, -1.7060546875, -1.6348876953125, -1.563720703125, -1.4925537109375, -1.42138671875, -1.3502197265625, -1.279052734375, -1.2078857421875, -1.13671875, -1.0655517578125, -0.994384765625, -0.9232177734375, -0.85205078125, -0.7808837890625, -0.709716796875, -0.6385498046875, -0.5673828125, -0.4962158203125, -0.425048828125, -0.3538818359375, -0.28271484375, -0.2115478515625, -0.140380859375, -0.0692138671875, 0.001953125, 0.0731201171875, 0.144287109375, 0.2154541015625, 0.28662109375, 0.3577880859375, 0.428955078125, 0.5001220703125, 0.5712890625, 0.6424560546875, 0.713623046875, 0.7847900390625, 0.85595703125, 0.9271240234375, 0.998291015625, 1.0694580078125, 1.140625, 1.2117919921875, 1.282958984375, 1.3541259765625, 1.42529296875, 1.4964599609375, 1.567626953125, 1.6387939453125, 1.7099609375, 1.7811279296875, 1.852294921875, 1.9234619140625, 1.99462890625, 2.0657958984375, 2.136962890625, 2.2081298828125, 2.279296875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 2.0, 2.0, 9.0, 7.0, 5.0, 12.0, 13.0, 16.0, 14.0, 25.0, 20.0, 19.0, 22.0, 27.0, 20.0, 38.0, 38.0, 30.0, 38.0, 52.0, 34.0, 42.0, 32.0, 44.0, 30.0, 37.0, 42.0, 38.0, 43.0, 25.0, 33.0, 16.0, 31.0, 16.0, 15.0, 17.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 5.0, 8.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.220703125, -1.1827545166015625, -1.144805908203125, -1.1068572998046875, -1.06890869140625, -1.0309600830078125, -0.993011474609375, -0.9550628662109375, -0.9171142578125, -0.8791656494140625, -0.841217041015625, -0.8032684326171875, -0.76531982421875, -0.7273712158203125, -0.689422607421875, -0.6514739990234375, -0.613525390625, -0.5755767822265625, -0.537628173828125, -0.4996795654296875, -0.46173095703125, -0.4237823486328125, -0.385833740234375, -0.3478851318359375, -0.3099365234375, -0.2719879150390625, -0.234039306640625, -0.1960906982421875, -0.15814208984375, -0.1201934814453125, -0.082244873046875, -0.0442962646484375, -0.00634765625, 0.0316009521484375, 0.069549560546875, 0.1074981689453125, 0.14544677734375, 0.1833953857421875, 0.221343994140625, 0.2592926025390625, 0.2972412109375, 0.3351898193359375, 0.373138427734375, 0.4110870361328125, 0.44903564453125, 0.4869842529296875, 0.524932861328125, 0.5628814697265625, 0.600830078125, 0.6387786865234375, 0.676727294921875, 0.7146759033203125, 0.75262451171875, 0.7905731201171875, 0.828521728515625, 0.8664703369140625, 0.9044189453125, 0.9423675537109375, 0.980316162109375, 1.0182647705078125, 1.05621337890625, 1.0941619873046875, 1.132110595703125, 1.1700592041015625, 1.2080078125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 10.0, 12.0, 13.0, 27.0, 34.0, 50.0, 104.0, 235.0, 659.0, 4144.0, 4156266.0, 31072.0, 1025.0, 298.0, 115.0, 76.0, 47.0, 29.0, 20.0, 15.0, 11.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.656494140625, -17.18798828125, -16.719482421875, -16.2509765625, -15.782470703125, -15.31396484375, -14.845458984375, -14.376953125, -13.908447265625, -13.43994140625, -12.971435546875, -12.5029296875, -12.034423828125, -11.56591796875, -11.097412109375, -10.62890625, -10.160400390625, -9.69189453125, -9.223388671875, -8.7548828125, -8.286376953125, -7.81787109375, -7.349365234375, -6.880859375, -6.412353515625, -5.94384765625, -5.475341796875, -5.0068359375, -4.538330078125, -4.06982421875, -3.601318359375, -3.1328125, -2.664306640625, -2.19580078125, -1.727294921875, -1.2587890625, -0.790283203125, -0.32177734375, 0.146728515625, 0.615234375, 1.083740234375, 1.55224609375, 2.020751953125, 2.4892578125, 2.957763671875, 3.42626953125, 3.894775390625, 4.36328125, 4.831787109375, 5.30029296875, 5.768798828125, 6.2373046875, 6.705810546875, 7.17431640625, 7.642822265625, 8.111328125, 8.579833984375, 9.04833984375, 9.516845703125, 9.9853515625, 10.453857421875, 10.92236328125, 11.390869140625, 11.859375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 9.0, 15.0, 12.0, 18.0, 33.0, 56.0, 67.0, 106.0, 173.0, 327.0, 650.0, 990.0, 718.0, 375.0, 189.0, 129.0, 74.0, 47.0, 23.0, 28.0, 9.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.1572265625, -1.1300506591796875, -1.102874755859375, -1.0756988525390625, -1.04852294921875, -1.0213470458984375, -0.994171142578125, -0.9669952392578125, -0.9398193359375, -0.9126434326171875, -0.885467529296875, -0.8582916259765625, -0.83111572265625, -0.8039398193359375, -0.776763916015625, -0.7495880126953125, -0.722412109375, -0.6952362060546875, -0.668060302734375, -0.6408843994140625, -0.61370849609375, -0.5865325927734375, -0.559356689453125, -0.5321807861328125, -0.5050048828125, -0.4778289794921875, -0.450653076171875, -0.4234771728515625, -0.39630126953125, -0.3691253662109375, -0.341949462890625, -0.3147735595703125, -0.28759765625, -0.2604217529296875, -0.233245849609375, -0.2060699462890625, -0.17889404296875, -0.1517181396484375, -0.124542236328125, -0.0973663330078125, -0.0701904296875, -0.0430145263671875, -0.015838623046875, 0.0113372802734375, 0.03851318359375, 0.0656890869140625, 0.092864990234375, 0.1200408935546875, 0.147216796875, 0.1743927001953125, 0.201568603515625, 0.2287445068359375, 0.25592041015625, 0.2830963134765625, 0.310272216796875, 0.3374481201171875, 0.3646240234375, 0.3917999267578125, 0.418975830078125, 0.4461517333984375, 0.47332763671875, 0.5005035400390625, 0.527679443359375, 0.5548553466796875, 0.58203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 17.0, 13.0, 18.0, 14.0, 23.0, 27.0, 27.0, 36.0, 51.0, 63.0, 63.0, 67.0, 62.0, 67.0, 53.0, 68.0, 55.0, 44.0, 43.0, 30.0, 30.0, 31.0, 19.0, 18.0, 10.0, 11.0, 6.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607733130455017, -1.5505421161651611, -1.4933512210845947, -1.4361602067947388, -1.3789691925048828, -1.3217781782150269, -1.264587163925171, -1.2073962688446045, -1.1502052545547485, -1.0930142402648926, -1.0358233451843262, -0.9786323308944702, -0.9214413166046143, -0.8642503023147583, -0.8070593476295471, -0.7498683929443359, -0.69267737865448, -0.635486364364624, -0.5782954096794128, -0.5211044549942017, -0.4639134407043457, -0.40672245621681213, -0.34953147172927856, -0.292340487241745, -0.23514950275421143, -0.17795851826667786, -0.12076753377914429, -0.06357654929161072, -0.0063855648040771484, 0.05080541968345642, 0.10799640417098999, 0.16518738865852356, 0.22237825393676758, 0.27956923842430115, 0.3367602229118347, 0.3939512073993683, 0.45114219188690186, 0.5083332061767578, 0.565524160861969, 0.6227151155471802, 0.6799061298370361, 0.7370971441268921, 0.7942880988121033, 0.8514790534973145, 0.9086700677871704, 0.9658610820770264, 1.0230519771575928, 1.0802429914474487, 1.1374340057373047, 1.1946250200271606, 1.2518160343170166, 1.309006929397583, 1.366197943687439, 1.423388957977295, 1.4805798530578613, 1.5377708673477173, 1.5949618816375732, 1.6521528959274292, 1.7093439102172852, 1.7665348052978516, 1.8237258195877075, 1.8809168338775635, 1.9381077289581299, 1.9952987432479858, 2.052489757537842]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 7.0, 7.0, 6.0, 6.0, 12.0, 12.0, 12.0, 12.0, 17.0, 24.0, 28.0, 23.0, 30.0, 29.0, 31.0, 40.0, 32.0, 50.0, 42.0, 47.0, 37.0, 37.0, 42.0, 37.0, 41.0, 30.0, 30.0, 37.0, 34.0, 32.0, 31.0, 27.0, 19.0, 11.0, 12.0, 18.0, 10.0, 13.0, 8.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3626282215118408, -1.3228709697723389, -1.283113718032837, -1.243356466293335, -1.203599214553833, -1.163841962814331, -1.124084711074829, -1.0843275785446167, -1.0445703268051147, -1.0048130750656128, -0.9650558233261108, -0.9252985715866089, -0.8855413794517517, -0.8457841277122498, -0.8060268759727478, -0.7662696838378906, -0.7265123724937439, -0.6867551207542419, -0.64699786901474, -0.6072406768798828, -0.5674834251403809, -0.5277261734008789, -0.48796892166137695, -0.4482116997241974, -0.40845444798469543, -0.3686971962451935, -0.3289399743080139, -0.28918272256851196, -0.2494254857301712, -0.20966824889183044, -0.1699109971523285, -0.13015377521514893, -0.09039652347564697, -0.050639282912015915, -0.010882042348384857, 0.0288752019405365, 0.06863243877887726, 0.10838967561721802, 0.14814692735671997, 0.18790414929389954, 0.2276614010334015, 0.26741865277290344, 0.307175874710083, 0.34693312644958496, 0.3866903781890869, 0.4264476001262665, 0.46620485186576843, 0.505962073802948, 0.54571932554245, 0.5854765772819519, 0.6252338290214539, 0.664991021156311, 0.704748272895813, 0.7445055246353149, 0.7842627763748169, 0.8240200281143188, 0.8637772798538208, 0.9035345315933228, 0.9432917833328247, 0.9830490350723267, 1.0228062868118286, 1.062563419342041, 1.102320671081543, 1.142077922821045, 1.1818351745605469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 16.0, 9.0, 13.0, 35.0, 36.0, 57.0, 76.0, 112.0, 163.0, 257.0, 356.0, 495.0, 755.0, 1166.0, 1832.0, 2828.0, 4551.0, 7334.0, 11790.0, 19237.0, 31382.0, 49733.0, 75503.0, 109138.0, 149427.0, 167305.0, 136680.0, 97392.0, 66818.0, 43133.0, 26990.0, 16337.0, 10206.0, 6393.0, 3887.0, 2407.0, 1551.0, 1034.0, 682.0, 445.0, 307.0, 191.0, 163.0, 87.0, 68.0, 49.0, 38.0, 26.0, 21.0, 16.0, 6.0, 0.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.45068359375, -0.4367485046386719, -0.42281341552734375, -0.4088783264160156, -0.3949432373046875, -0.3810081481933594, -0.36707305908203125, -0.3531379699707031, -0.339202880859375, -0.3252677917480469, -0.31133270263671875, -0.2973976135253906, -0.2834625244140625, -0.2695274353027344, -0.25559234619140625, -0.24165725708007812, -0.22772216796875, -0.21378707885742188, -0.19985198974609375, -0.18591690063476562, -0.1719818115234375, -0.15804672241210938, -0.14411163330078125, -0.13017654418945312, -0.116241455078125, -0.10230636596679688, -0.08837127685546875, -0.07443618774414062, -0.0605010986328125, -0.046566009521484375, -0.03263092041015625, -0.018695831298828125, -0.0047607421875, 0.009174346923828125, 0.02310943603515625, 0.037044525146484375, 0.0509796142578125, 0.06491470336914062, 0.07884979248046875, 0.09278488159179688, 0.106719970703125, 0.12065505981445312, 0.13459014892578125, 0.14852523803710938, 0.1624603271484375, 0.17639541625976562, 0.19033050537109375, 0.20426559448242188, 0.21820068359375, 0.23213577270507812, 0.24607086181640625, 0.2600059509277344, 0.2739410400390625, 0.2878761291503906, 0.30181121826171875, 0.3157463073730469, 0.329681396484375, 0.3436164855957031, 0.35755157470703125, 0.3714866638183594, 0.3854217529296875, 0.3993568420410156, 0.41329193115234375, 0.4272270202636719, 0.441162109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 9.0, 6.0, 3.0, 13.0, 10.0, 14.0, 18.0, 12.0, 23.0, 34.0, 33.0, 31.0, 40.0, 35.0, 44.0, 34.0, 40.0, 34.0, 46.0, 39.0, 44.0, 43.0, 43.0, 44.0, 35.0, 33.0, 32.0, 29.0, 25.0, 24.0, 16.0, 27.0, 10.0, 18.0, 10.0, 10.0, 5.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.76776123046875, -0.7425537109375, -0.71734619140625, -0.692138671875, -0.66693115234375, -0.6417236328125, -0.61651611328125, -0.59130859375, -0.56610107421875, -0.5408935546875, -0.51568603515625, -0.490478515625, -0.46527099609375, -0.4400634765625, -0.41485595703125, -0.3896484375, -0.36444091796875, -0.3392333984375, -0.31402587890625, -0.288818359375, -0.26361083984375, -0.2384033203125, -0.21319580078125, -0.18798828125, -0.16278076171875, -0.1375732421875, -0.11236572265625, -0.087158203125, -0.06195068359375, -0.0367431640625, -0.01153564453125, 0.013671875, 0.03887939453125, 0.0640869140625, 0.08929443359375, 0.114501953125, 0.13970947265625, 0.1649169921875, 0.19012451171875, 0.21533203125, 0.24053955078125, 0.2657470703125, 0.29095458984375, 0.316162109375, 0.34136962890625, 0.3665771484375, 0.39178466796875, 0.4169921875, 0.44219970703125, 0.4674072265625, 0.49261474609375, 0.517822265625, 0.54302978515625, 0.5682373046875, 0.59344482421875, 0.61865234375, 0.64385986328125, 0.6690673828125, 0.69427490234375, 0.719482421875, 0.74468994140625, 0.7698974609375, 0.79510498046875, 0.8203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 11.0, 5.0, 12.0, 17.0, 30.0, 33.0, 66.0, 86.0, 120.0, 265.0, 464.0, 856.0, 1821.0, 4691.0, 13456.0, 42485.0, 134809.0, 336255.0, 324697.0, 127626.0, 40222.0, 12479.0, 4443.0, 1736.0, 833.0, 406.0, 208.0, 152.0, 92.0, 52.0, 39.0, 27.0, 15.0, 14.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8916015625, -0.8628158569335938, -0.8340301513671875, -0.8052444458007812, -0.776458740234375, -0.7476730346679688, -0.7188873291015625, -0.6901016235351562, -0.66131591796875, -0.6325302124023438, -0.6037445068359375, -0.5749588012695312, -0.546173095703125, -0.5173873901367188, -0.4886016845703125, -0.45981597900390625, -0.4310302734375, -0.40224456787109375, -0.3734588623046875, -0.34467315673828125, -0.315887451171875, -0.28710174560546875, -0.2583160400390625, -0.22953033447265625, -0.20074462890625, -0.17195892333984375, -0.1431732177734375, -0.11438751220703125, -0.085601806640625, -0.05681610107421875, -0.0280303955078125, 0.00075531005859375, 0.029541015625, 0.05832672119140625, 0.0871124267578125, 0.11589813232421875, 0.144683837890625, 0.17346954345703125, 0.2022552490234375, 0.23104095458984375, 0.25982666015625, 0.28861236572265625, 0.3173980712890625, 0.34618377685546875, 0.374969482421875, 0.40375518798828125, 0.4325408935546875, 0.46132659912109375, 0.4901123046875, 0.5188980102539062, 0.5476837158203125, 0.5764694213867188, 0.605255126953125, 0.6340408325195312, 0.6628265380859375, 0.6916122436523438, 0.72039794921875, 0.7491836547851562, 0.7779693603515625, 0.8067550659179688, 0.835540771484375, 0.8643264770507812, 0.8931121826171875, 0.9218978881835938, 0.95068359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 10.0, 8.0, 8.0, 12.0, 15.0, 15.0, 15.0, 23.0, 26.0, 17.0, 24.0, 31.0, 43.0, 40.0, 42.0, 43.0, 44.0, 48.0, 48.0, 48.0, 30.0, 32.0, 49.0, 39.0, 37.0, 31.0, 30.0, 27.0, 24.0, 20.0, 14.0, 16.0, 11.0, 16.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4814453125, -1.430389404296875, -1.37933349609375, -1.328277587890625, -1.2772216796875, -1.226165771484375, -1.17510986328125, -1.124053955078125, -1.072998046875, -1.021942138671875, -0.97088623046875, -0.919830322265625, -0.8687744140625, -0.817718505859375, -0.76666259765625, -0.715606689453125, -0.66455078125, -0.613494873046875, -0.56243896484375, -0.511383056640625, -0.4603271484375, -0.409271240234375, -0.35821533203125, -0.307159423828125, -0.256103515625, -0.205047607421875, -0.15399169921875, -0.102935791015625, -0.0518798828125, -0.000823974609375, 0.05023193359375, 0.101287841796875, 0.15234375, 0.203399658203125, 0.25445556640625, 0.305511474609375, 0.3565673828125, 0.407623291015625, 0.45867919921875, 0.509735107421875, 0.560791015625, 0.611846923828125, 0.66290283203125, 0.713958740234375, 0.7650146484375, 0.816070556640625, 0.86712646484375, 0.918182373046875, 0.96923828125, 1.020294189453125, 1.07135009765625, 1.122406005859375, 1.1734619140625, 1.224517822265625, 1.27557373046875, 1.326629638671875, 1.377685546875, 1.428741455078125, 1.47979736328125, 1.530853271484375, 1.5819091796875, 1.632965087890625, 1.68402099609375, 1.735076904296875, 1.7861328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 8.0, 17.0, 21.0, 25.0, 36.0, 62.0, 104.0, 174.0, 280.0, 508.0, 918.0, 1944.0, 4003.0, 9654.0, 27748.0, 96089.0, 344551.0, 392403.0, 116751.0, 32795.0, 11363.0, 4627.0, 2030.0, 1033.0, 564.0, 340.0, 172.0, 116.0, 63.0, 44.0, 20.0, 23.0, 16.0, 12.0, 15.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.21630859375, -0.21047401428222656, -0.20463943481445312, -0.1988048553466797, -0.19297027587890625, -0.1871356964111328, -0.18130111694335938, -0.17546653747558594, -0.1696319580078125, -0.16379737854003906, -0.15796279907226562, -0.1521282196044922, -0.14629364013671875, -0.1404590606689453, -0.13462448120117188, -0.12878990173339844, -0.122955322265625, -0.11712074279785156, -0.11128616333007812, -0.10545158386230469, -0.09961700439453125, -0.09378242492675781, -0.08794784545898438, -0.08211326599121094, -0.0762786865234375, -0.07044410705566406, -0.06460952758789062, -0.05877494812011719, -0.05294036865234375, -0.04710578918457031, -0.041271209716796875, -0.03543663024902344, -0.02960205078125, -0.023767471313476562, -0.017932891845703125, -0.012098312377929688, -0.00626373291015625, -0.0004291534423828125, 0.005405426025390625, 0.011240005493164062, 0.0170745849609375, 0.022909164428710938, 0.028743743896484375, 0.03457832336425781, 0.04041290283203125, 0.04624748229980469, 0.052082061767578125, 0.05791664123535156, 0.063751220703125, 0.06958580017089844, 0.07542037963867188, 0.08125495910644531, 0.08708953857421875, 0.09292411804199219, 0.09875869750976562, 0.10459327697753906, 0.1104278564453125, 0.11626243591308594, 0.12209701538085938, 0.1279315948486328, 0.13376617431640625, 0.1396007537841797, 0.14543533325195312, 0.15126991271972656, 0.1571044921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 10.0, 15.0, 13.0, 14.0, 28.0, 28.0, 44.0, 48.0, 59.0, 91.0, 103.0, 95.0, 81.0, 70.0, 56.0, 36.0, 40.0, 27.0, 22.0, 20.0, 15.0, 12.0, 6.0, 5.0, 9.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.00011891871690750122, -0.00011481344699859619, -0.00011070817708969116, -0.00010660290718078613, -0.0001024976372718811, -9.839236736297607e-05, -9.428709745407104e-05, -9.018182754516602e-05, -8.607655763626099e-05, -8.197128772735596e-05, -7.786601781845093e-05, -7.37607479095459e-05, -6.965547800064087e-05, -6.555020809173584e-05, -6.144493818283081e-05, -5.733966827392578e-05, -5.323439836502075e-05, -4.912912845611572e-05, -4.502385854721069e-05, -4.0918588638305664e-05, -3.6813318729400635e-05, -3.2708048820495605e-05, -2.8602778911590576e-05, -2.4497509002685547e-05, -2.0392239093780518e-05, -1.6286969184875488e-05, -1.2181699275970459e-05, -8.07642936706543e-06, -3.9711594581604e-06, 1.341104507446289e-07, 4.239380359649658e-06, 8.344650268554688e-06, 1.2449920177459717e-05, 1.6555190086364746e-05, 2.0660459995269775e-05, 2.4765729904174805e-05, 2.8870999813079834e-05, 3.297626972198486e-05, 3.708153963088989e-05, 4.118680953979492e-05, 4.529207944869995e-05, 4.939734935760498e-05, 5.350261926651001e-05, 5.760788917541504e-05, 6.171315908432007e-05, 6.58184289932251e-05, 6.992369890213013e-05, 7.402896881103516e-05, 7.813423871994019e-05, 8.223950862884521e-05, 8.634477853775024e-05, 9.045004844665527e-05, 9.45553183555603e-05, 9.866058826446533e-05, 0.00010276585817337036, 0.00010687112808227539, 0.00011097639799118042, 0.00011508166790008545, 0.00011918693780899048, 0.0001232922077178955, 0.00012739747762680054, 0.00013150274753570557, 0.0001356080174446106, 0.00013971328735351562]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 15.0, 17.0, 43.0, 61.0, 137.0, 288.0, 1027.0, 5710.0, 118456.0, 869512.0, 48432.0, 3619.0, 771.0, 217.0, 100.0, 45.0, 18.0, 24.0, 14.0, 11.0, 8.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.45915985107421875, -0.4417572021484375, -0.42435455322265625, -0.406951904296875, -0.38954925537109375, -0.3721466064453125, -0.35474395751953125, -0.33734130859375, -0.31993865966796875, -0.3025360107421875, -0.28513336181640625, -0.267730712890625, -0.25032806396484375, -0.2329254150390625, -0.21552276611328125, -0.1981201171875, -0.18071746826171875, -0.1633148193359375, -0.14591217041015625, -0.128509521484375, -0.11110687255859375, -0.0937042236328125, -0.07630157470703125, -0.05889892578125, -0.04149627685546875, -0.0240936279296875, -0.00669097900390625, 0.010711669921875, 0.02811431884765625, 0.0455169677734375, 0.06291961669921875, 0.080322265625, 0.09772491455078125, 0.1151275634765625, 0.13253021240234375, 0.149932861328125, 0.16733551025390625, 0.1847381591796875, 0.20214080810546875, 0.21954345703125, 0.23694610595703125, 0.2543487548828125, 0.27175140380859375, 0.289154052734375, 0.30655670166015625, 0.3239593505859375, 0.34136199951171875, 0.3587646484375, 0.37616729736328125, 0.3935699462890625, 0.41097259521484375, 0.428375244140625, 0.44577789306640625, 0.4631805419921875, 0.48058319091796875, 0.49798583984375, 0.5153884887695312, 0.5327911376953125, 0.5501937866210938, 0.567596435546875, 0.5849990844726562, 0.6024017333984375, 0.6198043823242188, 0.63720703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 10.0, 14.0, 16.0, 21.0, 31.0, 58.0, 56.0, 73.0, 81.0, 138.0, 113.0, 100.0, 88.0, 59.0, 44.0, 32.0, 20.0, 13.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080078125, -0.07722663879394531, -0.07437515258789062, -0.07152366638183594, -0.06867218017578125, -0.06582069396972656, -0.06296920776367188, -0.06011772155761719, -0.0572662353515625, -0.05441474914550781, -0.051563262939453125, -0.04871177673339844, -0.04586029052734375, -0.04300880432128906, -0.040157318115234375, -0.03730583190917969, -0.034454345703125, -0.03160285949707031, -0.028751373291015625, -0.025899887084960938, -0.02304840087890625, -0.020196914672851562, -0.017345428466796875, -0.014493942260742188, -0.0116424560546875, -0.008790969848632812, -0.005939483642578125, -0.0030879974365234375, -0.00023651123046875, 0.0026149749755859375, 0.005466461181640625, 0.008317947387695312, 0.01116943359375, 0.014020919799804688, 0.016872406005859375, 0.019723892211914062, 0.02257537841796875, 0.025426864624023438, 0.028278350830078125, 0.031129837036132812, 0.0339813232421875, 0.03683280944824219, 0.039684295654296875, 0.04253578186035156, 0.04538726806640625, 0.04823875427246094, 0.051090240478515625, 0.05394172668457031, 0.056793212890625, 0.05964469909667969, 0.062496185302734375, 0.06534767150878906, 0.06819915771484375, 0.07105064392089844, 0.07390213012695312, 0.07675361633300781, 0.0796051025390625, 0.08245658874511719, 0.08530807495117188, 0.08815956115722656, 0.09101104736328125, 0.09386253356933594, 0.09671401977539062, 0.09956550598144531, 0.1024169921875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 15.0, 33.0, 74.0, 158.0, 217.0, 215.0, 164.0, 69.0, 29.0, 19.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.363602638244629, -2.260921001434326, -2.1582393646240234, -2.0555577278137207, -1.952876091003418, -1.8501944541931152, -1.747512698173523, -1.6448310613632202, -1.5421494245529175, -1.4394677877426147, -1.336786150932312, -1.2341043949127197, -1.131422758102417, -1.0287411212921143, -0.9260594844818115, -0.8233778476715088, -0.720696210861206, -0.6180145740509033, -0.5153329372406006, -0.4126512408256531, -0.30996960401535034, -0.2072879672050476, -0.1046062707901001, -0.0019246339797973633, 0.10075700283050537, 0.2034386545419693, 0.3061203062534332, 0.40880197286605835, 0.5114836096763611, 0.6141652464866638, 0.7168469429016113, 0.8195285797119141, 0.9222102165222168, 1.0248918533325195, 1.1275734901428223, 1.230255126953125, 1.3329367637634277, 1.4356184005737305, 1.5383001565933228, 1.6409817934036255, 1.7436634302139282, 1.846345067024231, 1.9490267038345337, 2.051708459854126, 2.1543900966644287, 2.2570717334747314, 2.359753370285034, 2.462435007095337, 2.5651166439056396, 2.6677982807159424, 2.770479917526245, 2.873161554336548, 2.9758431911468506, 3.0785248279571533, 3.181206703186035, 3.283888339996338, 3.3865699768066406, 3.4892516136169434, 3.591933250427246, 3.694614887237549, 3.7972965240478516, 3.8999781608581543, 4.002659797668457, 4.10534143447876, 4.2080230712890625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 8.0, 9.0, 12.0, 18.0, 24.0, 24.0, 33.0, 21.0, 31.0, 36.0, 35.0, 45.0, 33.0, 64.0, 39.0, 45.0, 45.0, 45.0, 40.0, 30.0, 41.0, 45.0, 23.0, 36.0, 40.0, 25.0, 21.0, 18.0, 16.0, 15.0, 13.0, 12.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7979270219802856, -0.7721570134162903, -0.7463870644569397, -0.7206170558929443, -0.6948471069335938, -0.6690770983695984, -0.643307089805603, -0.6175371408462524, -0.5917671322822571, -0.5659971237182617, -0.5402271747589111, -0.5144571661949158, -0.4886871874332428, -0.4629172086715698, -0.43714720010757446, -0.4113772213459015, -0.3856072425842285, -0.35983726382255554, -0.33406728506088257, -0.3082972764968872, -0.28252729773521423, -0.25675731897354126, -0.2309873253107071, -0.20521733164787292, -0.17944735288619995, -0.15367737412452698, -0.1279073804616928, -0.10213739424943924, -0.07636740803718567, -0.050597429275512695, -0.024827435612678528, 0.0009425580501556396, 0.02671259641647339, 0.05248258262872696, 0.07825256884098053, 0.1040225550532341, 0.12979254126548767, 0.15556252002716064, 0.1813325136899948, 0.20710250735282898, 0.23287248611450195, 0.2586424648761749, 0.2844124436378479, 0.31018245220184326, 0.33595243096351624, 0.3617224097251892, 0.38749241828918457, 0.41326239705085754, 0.4390323758125305, 0.4648023545742035, 0.49057233333587646, 0.5163423418998718, 0.5421123504638672, 0.5678822994232178, 0.5936523079872131, 0.6194223165512085, 0.6451922655105591, 0.6709622740745544, 0.696732223033905, 0.7225022315979004, 0.748272180557251, 0.7740421891212463, 0.7998121976852417, 0.8255821466445923, 0.8513521552085876]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 8.0, 3.0, 8.0, 14.0, 21.0, 27.0, 45.0, 68.0, 114.0, 137.0, 202.0, 338.0, 510.0, 824.0, 1433.0, 2427.0, 3846.0, 6787.0, 12136.0, 21624.0, 39585.0, 73263.0, 131965.0, 215522.0, 222356.0, 140589.0, 78571.0, 42610.0, 23151.0, 12772.0, 7202.0, 4062.0, 2405.0, 1472.0, 856.0, 550.0, 349.0, 246.0, 145.0, 107.0, 79.0, 39.0, 22.0, 26.0, 14.0, 9.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.26392364501953125, -0.2551422119140625, -0.24636077880859375, -0.237579345703125, -0.22879791259765625, -0.2200164794921875, -0.21123504638671875, -0.20245361328125, -0.19367218017578125, -0.1848907470703125, -0.17610931396484375, -0.167327880859375, -0.15854644775390625, -0.1497650146484375, -0.14098358154296875, -0.1322021484375, -0.12342071533203125, -0.1146392822265625, -0.10585784912109375, -0.097076416015625, -0.08829498291015625, -0.0795135498046875, -0.07073211669921875, -0.06195068359375, -0.05316925048828125, -0.0443878173828125, -0.03560638427734375, -0.026824951171875, -0.01804351806640625, -0.0092620849609375, -0.00048065185546875, 0.00830078125, 0.01708221435546875, 0.0258636474609375, 0.03464508056640625, 0.043426513671875, 0.05220794677734375, 0.0609893798828125, 0.06977081298828125, 0.07855224609375, 0.08733367919921875, 0.0961151123046875, 0.10489654541015625, 0.113677978515625, 0.12245941162109375, 0.1312408447265625, 0.14002227783203125, 0.1488037109375, 0.15758514404296875, 0.1663665771484375, 0.17514801025390625, 0.183929443359375, 0.19271087646484375, 0.2014923095703125, 0.21027374267578125, 0.21905517578125, 0.22783660888671875, 0.2366180419921875, 0.24539947509765625, 0.254180908203125, 0.26296234130859375, 0.2717437744140625, 0.28052520751953125, 0.289306640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 6.0, 9.0, 7.0, 11.0, 13.0, 14.0, 22.0, 21.0, 34.0, 24.0, 41.0, 26.0, 35.0, 40.0, 52.0, 51.0, 45.0, 47.0, 49.0, 50.0, 46.0, 37.0, 38.0, 35.0, 37.0, 37.0, 30.0, 22.0, 14.0, 18.0, 14.0, 20.0, 12.0, 8.0, 6.0, 11.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.33587646484375, -4.1990966796875, -4.06231689453125, -3.925537109375, -3.78875732421875, -3.6519775390625, -3.51519775390625, -3.37841796875, -3.24163818359375, -3.1048583984375, -2.96807861328125, -2.831298828125, -2.69451904296875, -2.5577392578125, -2.42095947265625, -2.2841796875, -2.14739990234375, -2.0106201171875, -1.87384033203125, -1.737060546875, -1.60028076171875, -1.4635009765625, -1.32672119140625, -1.18994140625, -1.05316162109375, -0.9163818359375, -0.77960205078125, -0.642822265625, -0.50604248046875, -0.3692626953125, -0.23248291015625, -0.095703125, 0.04107666015625, 0.1778564453125, 0.31463623046875, 0.451416015625, 0.58819580078125, 0.7249755859375, 0.86175537109375, 0.99853515625, 1.13531494140625, 1.2720947265625, 1.40887451171875, 1.545654296875, 1.68243408203125, 1.8192138671875, 1.95599365234375, 2.0927734375, 2.22955322265625, 2.3663330078125, 2.50311279296875, 2.639892578125, 2.77667236328125, 2.9134521484375, 3.05023193359375, 3.18701171875, 3.32379150390625, 3.4605712890625, 3.59735107421875, 3.734130859375, 3.87091064453125, 4.0076904296875, 4.14447021484375, 4.28125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 8.0, 7.0, 8.0, 8.0, 11.0, 13.0, 25.0, 15.0, 25.0, 32.0, 50.0, 47.0, 60.0, 75.0, 100.0, 138.0, 228.0, 386.0, 1035.0, 7498.0, 693518.0, 338703.0, 4590.0, 839.0, 382.0, 206.0, 126.0, 91.0, 62.0, 44.0, 46.0, 32.0, 36.0, 35.0, 15.0, 8.0, 9.0, 8.0, 11.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.328125, -2.24761962890625, -2.1671142578125, -2.08660888671875, -2.006103515625, -1.92559814453125, -1.8450927734375, -1.76458740234375, -1.68408203125, -1.60357666015625, -1.5230712890625, -1.44256591796875, -1.362060546875, -1.28155517578125, -1.2010498046875, -1.12054443359375, -1.0400390625, -0.95953369140625, -0.8790283203125, -0.79852294921875, -0.718017578125, -0.63751220703125, -0.5570068359375, -0.47650146484375, -0.39599609375, -0.31549072265625, -0.2349853515625, -0.15447998046875, -0.073974609375, 0.00653076171875, 0.0870361328125, 0.16754150390625, 0.248046875, 0.32855224609375, 0.4090576171875, 0.48956298828125, 0.570068359375, 0.65057373046875, 0.7310791015625, 0.81158447265625, 0.89208984375, 0.97259521484375, 1.0531005859375, 1.13360595703125, 1.214111328125, 1.29461669921875, 1.3751220703125, 1.45562744140625, 1.5361328125, 1.61663818359375, 1.6971435546875, 1.77764892578125, 1.858154296875, 1.93865966796875, 2.0191650390625, 2.09967041015625, 2.18017578125, 2.26068115234375, 2.3411865234375, 2.42169189453125, 2.502197265625, 2.58270263671875, 2.6632080078125, 2.74371337890625, 2.82421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 9.0, 13.0, 12.0, 17.0, 17.0, 21.0, 28.0, 32.0, 24.0, 31.0, 24.0, 38.0, 40.0, 43.0, 42.0, 38.0, 39.0, 42.0, 40.0, 38.0, 34.0, 41.0, 44.0, 27.0, 36.0, 24.0, 23.0, 22.0, 24.0, 26.0, 24.0, 10.0, 8.0, 6.0, 9.0, 12.0, 9.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.609375, -3.483642578125, -3.35791015625, -3.232177734375, -3.1064453125, -2.980712890625, -2.85498046875, -2.729248046875, -2.603515625, -2.477783203125, -2.35205078125, -2.226318359375, -2.1005859375, -1.974853515625, -1.84912109375, -1.723388671875, -1.59765625, -1.471923828125, -1.34619140625, -1.220458984375, -1.0947265625, -0.968994140625, -0.84326171875, -0.717529296875, -0.591796875, -0.466064453125, -0.34033203125, -0.214599609375, -0.0888671875, 0.036865234375, 0.16259765625, 0.288330078125, 0.4140625, 0.539794921875, 0.66552734375, 0.791259765625, 0.9169921875, 1.042724609375, 1.16845703125, 1.294189453125, 1.419921875, 1.545654296875, 1.67138671875, 1.797119140625, 1.9228515625, 2.048583984375, 2.17431640625, 2.300048828125, 2.42578125, 2.551513671875, 2.67724609375, 2.802978515625, 2.9287109375, 3.054443359375, 3.18017578125, 3.305908203125, 3.431640625, 3.557373046875, 3.68310546875, 3.808837890625, 3.9345703125, 4.060302734375, 4.18603515625, 4.311767578125, 4.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 0.0, 2.0, 8.0, 12.0, 12.0, 23.0, 33.0, 46.0, 73.0, 93.0, 186.0, 273.0, 543.0, 1068.0, 2299.0, 5643.0, 18151.0, 77801.0, 642498.0, 241609.0, 40055.0, 10814.0, 3850.0, 1591.0, 795.0, 430.0, 255.0, 152.0, 63.0, 57.0, 42.0, 24.0, 15.0, 13.0, 13.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.1320629119873047, -0.12777328491210938, -0.12348365783691406, -0.11919403076171875, -0.11490440368652344, -0.11061477661132812, -0.10632514953613281, -0.1020355224609375, -0.09774589538574219, -0.09345626831054688, -0.08916664123535156, -0.08487701416015625, -0.08058738708496094, -0.07629776000976562, -0.07200813293457031, -0.067718505859375, -0.06342887878417969, -0.059139251708984375, -0.05484962463378906, -0.05055999755859375, -0.04627037048339844, -0.041980743408203125, -0.03769111633300781, -0.0334014892578125, -0.029111862182617188, -0.024822235107421875, -0.020532608032226562, -0.01624298095703125, -0.011953353881835938, -0.007663726806640625, -0.0033740997314453125, 0.00091552734375, 0.0052051544189453125, 0.009494781494140625, 0.013784408569335938, 0.01807403564453125, 0.022363662719726562, 0.026653289794921875, 0.030942916870117188, 0.0352325439453125, 0.03952217102050781, 0.043811798095703125, 0.04810142517089844, 0.05239105224609375, 0.05668067932128906, 0.060970306396484375, 0.06525993347167969, 0.069549560546875, 0.07383918762207031, 0.07812881469726562, 0.08241844177246094, 0.08670806884765625, 0.09099769592285156, 0.09528732299804688, 0.09957695007324219, 0.1038665771484375, 0.10815620422363281, 0.11244583129882812, 0.11673545837402344, 0.12102508544921875, 0.12531471252441406, 0.12960433959960938, 0.1338939666748047, 0.13818359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 16.0, 26.0, 39.0, 60.0, 128.0, 240.0, 217.0, 114.0, 55.0, 30.0, 21.0, 17.0, 7.0, 6.0, 0.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -5.1625072956085205e-05, -5.0261616706848145e-05, -4.8898160457611084e-05, -4.7534704208374023e-05, -4.617124795913696e-05, -4.48077917098999e-05, -4.344433546066284e-05, -4.208087921142578e-05, -4.071742296218872e-05, -3.935396671295166e-05, -3.79905104637146e-05, -3.662705421447754e-05, -3.526359796524048e-05, -3.390014171600342e-05, -3.253668546676636e-05, -3.11732292175293e-05, -2.9809772968292236e-05, -2.8446316719055176e-05, -2.7082860469818115e-05, -2.5719404220581055e-05, -2.4355947971343994e-05, -2.2992491722106934e-05, -2.1629035472869873e-05, -2.0265579223632812e-05, -1.8902122974395752e-05, -1.753866672515869e-05, -1.617521047592163e-05, -1.481175422668457e-05, -1.344829797744751e-05, -1.208484172821045e-05, -1.0721385478973389e-05, -9.357929229736328e-06, -7.994472980499268e-06, -6.631016731262207e-06, -5.2675604820251465e-06, -3.904104232788086e-06, -2.5406479835510254e-06, -1.1771917343139648e-06, 1.862645149230957e-07, 1.5497207641601562e-06, 2.913177013397217e-06, 4.276633262634277e-06, 5.640089511871338e-06, 7.0035457611083984e-06, 8.367002010345459e-06, 9.73045825958252e-06, 1.109391450881958e-05, 1.245737075805664e-05, 1.3820827007293701e-05, 1.5184283256530762e-05, 1.6547739505767822e-05, 1.7911195755004883e-05, 1.9274652004241943e-05, 2.0638108253479004e-05, 2.2001564502716064e-05, 2.3365020751953125e-05, 2.4728477001190186e-05, 2.6091933250427246e-05, 2.7455389499664307e-05, 2.8818845748901367e-05, 3.0182301998138428e-05, 3.154575824737549e-05, 3.290921449661255e-05, 3.427267074584961e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 10.0, 22.0, 32.0, 32.0, 53.0, 61.0, 114.0, 150.0, 253.0, 411.0, 757.0, 1712.0, 4209.0, 13126.0, 49936.0, 349796.0, 538678.0, 63976.0, 16055.0, 4979.0, 1981.0, 929.0, 450.0, 298.0, 161.0, 127.0, 66.0, 43.0, 54.0, 24.0, 14.0, 13.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1336517333984375, -0.129486083984375, -0.1253204345703125, -0.12115478515625, -0.1169891357421875, -0.112823486328125, -0.1086578369140625, -0.1044921875, -0.1003265380859375, -0.096160888671875, -0.0919952392578125, -0.08782958984375, -0.0836639404296875, -0.079498291015625, -0.0753326416015625, -0.0711669921875, -0.0670013427734375, -0.062835693359375, -0.0586700439453125, -0.05450439453125, -0.0503387451171875, -0.046173095703125, -0.0420074462890625, -0.037841796875, -0.0336761474609375, -0.029510498046875, -0.0253448486328125, -0.02117919921875, -0.0170135498046875, -0.012847900390625, -0.0086822509765625, -0.0045166015625, -0.0003509521484375, 0.003814697265625, 0.0079803466796875, 0.01214599609375, 0.0163116455078125, 0.020477294921875, 0.0246429443359375, 0.02880859375, 0.0329742431640625, 0.037139892578125, 0.0413055419921875, 0.04547119140625, 0.0496368408203125, 0.053802490234375, 0.0579681396484375, 0.0621337890625, 0.0662994384765625, 0.070465087890625, 0.0746307373046875, 0.07879638671875, 0.0829620361328125, 0.087127685546875, 0.0912933349609375, 0.095458984375, 0.0996246337890625, 0.103790283203125, 0.1079559326171875, 0.11212158203125, 0.1162872314453125, 0.120452880859375, 0.1246185302734375, 0.1287841796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 7.0, 15.0, 16.0, 25.0, 15.0, 30.0, 23.0, 46.0, 71.0, 96.0, 134.0, 132.0, 107.0, 71.0, 43.0, 28.0, 29.0, 15.0, 12.0, 9.0, 13.0, 12.0, 4.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04718017578125, -0.04583597183227539, -0.04449176788330078, -0.04314756393432617, -0.04180335998535156, -0.04045915603637695, -0.039114952087402344, -0.037770748138427734, -0.036426544189453125, -0.035082340240478516, -0.033738136291503906, -0.0323939323425293, -0.031049728393554688, -0.029705524444580078, -0.02836132049560547, -0.02701711654663086, -0.02567291259765625, -0.02432870864868164, -0.02298450469970703, -0.021640300750732422, -0.020296096801757812, -0.018951892852783203, -0.017607688903808594, -0.016263484954833984, -0.014919281005859375, -0.013575077056884766, -0.012230873107910156, -0.010886669158935547, -0.009542465209960938, -0.008198261260986328, -0.006854057312011719, -0.005509853363037109, -0.0041656494140625, -0.0028214454650878906, -0.0014772415161132812, -0.00013303756713867188, 0.0012111663818359375, 0.002555370330810547, 0.0038995742797851562, 0.005243778228759766, 0.006587982177734375, 0.007932186126708984, 0.009276390075683594, 0.010620594024658203, 0.011964797973632812, 0.013309001922607422, 0.014653205871582031, 0.01599740982055664, 0.01734161376953125, 0.01868581771850586, 0.02003002166748047, 0.021374225616455078, 0.022718429565429688, 0.024062633514404297, 0.025406837463378906, 0.026751041412353516, 0.028095245361328125, 0.029439449310302734, 0.030783653259277344, 0.03212785720825195, 0.03347206115722656, 0.03481626510620117, 0.03616046905517578, 0.03750467300415039, 0.038848876953125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 50.0, 629.0, 325.0, 17.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.586158752441406, -35.9533805847168, -35.32060241699219, -34.68782424926758, -34.05504608154297, -33.422271728515625, -32.789493560791016, -32.156715393066406, -31.523937225341797, -30.891159057617188, -30.258380889892578, -29.6256046295166, -28.992826461791992, -28.360048294067383, -27.727270126342773, -27.094491958618164, -26.461713790893555, -25.828935623168945, -25.196157455444336, -24.56338119506836, -23.93060302734375, -23.29782485961914, -22.66504669189453, -22.032268524169922, -21.399490356445312, -20.766712188720703, -20.133934020996094, -19.501157760620117, -18.868379592895508, -18.2356014251709, -17.60282325744629, -16.97004508972168, -16.33726692199707, -15.704488754272461, -15.071711540222168, -14.438933372497559, -13.806156158447266, -13.173377990722656, -12.540599822998047, -11.907821655273438, -11.275044441223145, -10.642266273498535, -10.009489059448242, -9.376710891723633, -8.743932723999023, -8.11115550994873, -7.478377342224121, -6.84559965133667, -6.212821960449219, -5.580044269561768, -4.947266578674316, -4.314488410949707, -3.681710720062256, -3.0489330291748047, -2.4161550998687744, -1.7833771705627441, -1.150599479675293, -0.5178216695785522, 0.11495614051818848, 0.7477339506149292, 1.38051176071167, 2.013289451599121, 2.6460673809051514, 3.2788453102111816, 3.911623001098633]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 3.0, 5.0, 0.0, 4.0, 10.0, 6.0, 19.0, 13.0, 20.0, 16.0, 12.0, 22.0, 21.0, 34.0, 37.0, 40.0, 25.0, 31.0, 34.0, 33.0, 38.0, 48.0, 39.0, 36.0, 32.0, 36.0, 45.0, 37.0, 36.0, 36.0, 31.0, 16.0, 23.0, 31.0, 22.0, 27.0, 15.0, 11.0, 13.0, 6.0, 5.0, 3.0, 2.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.821846961975098, -5.630846977233887, -5.439846992492676, -5.248847007751465, -5.057846546173096, -4.866846561431885, -4.675846576690674, -4.484846591949463, -4.293846130371094, -4.102846145629883, -3.9118459224700928, -3.720845937728882, -3.529845714569092, -3.338845729827881, -3.14784574508667, -2.956845760345459, -2.765845775604248, -2.574845790863037, -2.383845567703247, -2.192845582962036, -2.001845359802246, -1.8108453750610352, -1.6198453903198242, -1.4288452863693237, -1.2378451824188232, -1.0468450784683228, -0.855845034122467, -0.6648449897766113, -0.47384488582611084, -0.28284478187561035, -0.09184479713439941, 0.09915530681610107, 0.29015541076660156, 0.48115548491477966, 0.6721555590629578, 0.8631556034088135, 1.054155707359314, 1.2451558113098145, 1.4361557960510254, 1.6271559000015259, 1.8181560039520264, 2.0091559886932373, 2.2001562118530273, 2.3911561965942383, 2.582156181335449, 2.7731564044952393, 2.96415638923645, 3.1551566123962402, 3.346156597137451, 3.537156581878662, 3.728156805038452, 3.919156789779663, 4.110157012939453, 4.301156997680664, 4.492156982421875, 4.683156967163086, 4.874156951904297, 5.065156936645508, 5.256156921386719, 5.44715690612793, 5.638157367706299, 5.82915735244751, 6.020157337188721, 6.211157321929932, 6.402157783508301]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 1.0, 8.0, 4.0, 10.0, 9.0, 16.0, 14.0, 14.0, 29.0, 23.0, 30.0, 65.0, 89.0, 148.0, 277.0, 697.0, 1816.0, 7267.0, 35438.0, 429631.0, 2797194.0, 845991.0, 61685.0, 9562.0, 2529.0, 855.0, 348.0, 174.0, 90.0, 44.0, 39.0, 35.0, 34.0, 22.0, 16.0, 13.0, 11.0, 6.0, 6.0, 9.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.923828125, -1.8666229248046875, -1.809417724609375, -1.7522125244140625, -1.69500732421875, -1.6378021240234375, -1.580596923828125, -1.5233917236328125, -1.4661865234375, -1.4089813232421875, -1.351776123046875, -1.2945709228515625, -1.23736572265625, -1.1801605224609375, -1.122955322265625, -1.0657501220703125, -1.008544921875, -0.9513397216796875, -0.894134521484375, -0.8369293212890625, -0.77972412109375, -0.7225189208984375, -0.665313720703125, -0.6081085205078125, -0.5509033203125, -0.4936981201171875, -0.436492919921875, -0.3792877197265625, -0.32208251953125, -0.2648773193359375, -0.207672119140625, -0.1504669189453125, -0.09326171875, -0.0360565185546875, 0.021148681640625, 0.0783538818359375, 0.13555908203125, 0.1927642822265625, 0.249969482421875, 0.3071746826171875, 0.3643798828125, 0.4215850830078125, 0.478790283203125, 0.5359954833984375, 0.59320068359375, 0.6504058837890625, 0.707611083984375, 0.7648162841796875, 0.822021484375, 0.8792266845703125, 0.936431884765625, 0.9936370849609375, 1.05084228515625, 1.1080474853515625, 1.165252685546875, 1.2224578857421875, 1.2796630859375, 1.3368682861328125, 1.394073486328125, 1.4512786865234375, 1.50848388671875, 1.5656890869140625, 1.622894287109375, 1.6800994873046875, 1.7373046875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 11.0, 13.0, 9.0, 15.0, 28.0, 30.0, 38.0, 53.0, 47.0, 55.0, 58.0, 52.0, 74.0, 60.0, 57.0, 57.0, 55.0, 57.0, 46.0, 41.0, 28.0, 25.0, 22.0, 11.0, 16.0, 13.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.9024200439453125, -0.863433837890625, -0.8244476318359375, -0.78546142578125, -0.7464752197265625, -0.707489013671875, -0.6685028076171875, -0.6295166015625, -0.5905303955078125, -0.551544189453125, -0.5125579833984375, -0.47357177734375, -0.4345855712890625, -0.395599365234375, -0.3566131591796875, -0.317626953125, -0.2786407470703125, -0.239654541015625, -0.2006683349609375, -0.16168212890625, -0.1226959228515625, -0.083709716796875, -0.0447235107421875, -0.0057373046875, 0.0332489013671875, 0.072235107421875, 0.1112213134765625, 0.15020751953125, 0.1891937255859375, 0.228179931640625, 0.2671661376953125, 0.30615234375, 0.3451385498046875, 0.384124755859375, 0.4231109619140625, 0.46209716796875, 0.5010833740234375, 0.540069580078125, 0.5790557861328125, 0.6180419921875, 0.6570281982421875, 0.696014404296875, 0.7350006103515625, 0.77398681640625, 0.8129730224609375, 0.851959228515625, 0.8909454345703125, 0.929931640625, 0.9689178466796875, 1.007904052734375, 1.0468902587890625, 1.08587646484375, 1.1248626708984375, 1.163848876953125, 1.2028350830078125, 1.2418212890625, 1.2808074951171875, 1.319793701171875, 1.3587799072265625, 1.39776611328125, 1.4367523193359375, 1.475738525390625, 1.5147247314453125, 1.5537109375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 27.0, 48.0, 179.0, 2471573.0, 1722150.0, 178.0, 52.0, 18.0, 16.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.1875, -38.25439453125, -37.3212890625, -36.38818359375, -35.455078125, -34.52197265625, -33.5888671875, -32.65576171875, -31.72265625, -30.78955078125, -29.8564453125, -28.92333984375, -27.990234375, -27.05712890625, -26.1240234375, -25.19091796875, -24.2578125, -23.32470703125, -22.3916015625, -21.45849609375, -20.525390625, -19.59228515625, -18.6591796875, -17.72607421875, -16.79296875, -15.85986328125, -14.9267578125, -13.99365234375, -13.060546875, -12.12744140625, -11.1943359375, -10.26123046875, -9.328125, -8.39501953125, -7.4619140625, -6.52880859375, -5.595703125, -4.66259765625, -3.7294921875, -2.79638671875, -1.86328125, -0.93017578125, 0.0029296875, 0.93603515625, 1.869140625, 2.80224609375, 3.7353515625, 4.66845703125, 5.6015625, 6.53466796875, 7.4677734375, 8.40087890625, 9.333984375, 10.26708984375, 11.2001953125, 12.13330078125, 13.06640625, 13.99951171875, 14.9326171875, 15.86572265625, 16.798828125, 17.73193359375, 18.6650390625, 19.59814453125, 20.53125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 17.0, 22.0, 43.0, 77.0, 144.0, 313.0, 789.0, 1232.0, 767.0, 323.0, 170.0, 72.0, 35.0, 28.0, 13.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94873046875, -0.9240646362304688, -0.8993988037109375, -0.8747329711914062, -0.850067138671875, -0.8254013061523438, -0.8007354736328125, -0.7760696411132812, -0.75140380859375, -0.7267379760742188, -0.7020721435546875, -0.6774063110351562, -0.652740478515625, -0.6280746459960938, -0.6034088134765625, -0.5787429809570312, -0.5540771484375, -0.5294113159179688, -0.5047454833984375, -0.48007965087890625, -0.455413818359375, -0.43074798583984375, -0.4060821533203125, -0.38141632080078125, -0.35675048828125, -0.33208465576171875, -0.3074188232421875, -0.28275299072265625, -0.258087158203125, -0.23342132568359375, -0.2087554931640625, -0.18408966064453125, -0.159423828125, -0.13475799560546875, -0.1100921630859375, -0.08542633056640625, -0.060760498046875, -0.03609466552734375, -0.0114288330078125, 0.01323699951171875, 0.03790283203125, 0.06256866455078125, 0.0872344970703125, 0.11190032958984375, 0.136566162109375, 0.16123199462890625, 0.1858978271484375, 0.21056365966796875, 0.2352294921875, 0.25989532470703125, 0.2845611572265625, 0.30922698974609375, 0.333892822265625, 0.35855865478515625, 0.3832244873046875, 0.40789031982421875, 0.43255615234375, 0.45722198486328125, 0.4818878173828125, 0.5065536499023438, 0.531219482421875, 0.5558853149414062, 0.5805511474609375, 0.6052169799804688, 0.6298828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 14.0, 11.0, 17.0, 36.0, 34.0, 41.0, 70.0, 72.0, 66.0, 92.0, 88.0, 80.0, 89.0, 71.0, 55.0, 47.0, 17.0, 28.0, 20.0, 13.0, 12.0, 8.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4012956619262695, -1.3553353548049927, -1.3093749284744263, -1.2634146213531494, -1.217454195022583, -1.1714938879013062, -1.1255335807800293, -1.079573154449463, -1.0336127281188965, -0.9876523613929749, -0.9416919946670532, -0.8957316875457764, -0.84977126121521, -0.8038109540939331, -0.7578505873680115, -0.7118902206420898, -0.665929913520813, -0.6199695467948914, -0.5740091800689697, -0.5280488729476929, -0.48208847641944885, -0.4361281096935272, -0.390167772769928, -0.34420740604400635, -0.2982470393180847, -0.2522866725921631, -0.20632632076740265, -0.1603659689426422, -0.11440560221672058, -0.06844523549079895, -0.022484898567199707, 0.023475468158721924, 0.0694359540939331, 0.11539631336927414, 0.16135667264461517, 0.2073170244693756, 0.25327739119529724, 0.29923775792121887, 0.3451980948448181, 0.39115846157073975, 0.4371188282966614, 0.483079195022583, 0.5290395617485046, 0.5749999284744263, 0.6209602355957031, 0.6669206619262695, 0.7128809690475464, 0.758841335773468, 0.8048017024993896, 0.8507620692253113, 0.8967224359512329, 0.9426827430725098, 0.9886431694030762, 1.034603476524353, 1.0805637836456299, 1.1265242099761963, 1.1724846363067627, 1.2184449434280396, 1.264405369758606, 1.3103656768798828, 1.3563261032104492, 1.402286410331726, 1.448246717453003, 1.4942071437835693, 1.5401674509048462]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 15.0, 18.0, 15.0, 18.0, 18.0, 20.0, 30.0, 39.0, 30.0, 30.0, 21.0, 37.0, 34.0, 48.0, 43.0, 49.0, 46.0, 48.0, 52.0, 41.0, 52.0, 30.0, 35.0, 19.0, 25.0, 38.0, 22.0, 19.0, 15.0, 15.0, 18.0, 8.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8428260684013367, -0.8140411972999573, -0.7852563261985779, -0.7564714550971985, -0.7276865839958191, -0.6989017128944397, -0.6701167821884155, -0.6413319110870361, -0.6125470399856567, -0.5837621688842773, -0.554977297782898, -0.5261924266815186, -0.49740755558013916, -0.46862268447875977, -0.439837783575058, -0.4110529124736786, -0.3822680711746216, -0.3534832000732422, -0.3246983289718628, -0.2959134578704834, -0.267128586769104, -0.23834370076656342, -0.20955881476402283, -0.18077394366264343, -0.15198907256126404, -0.12320420145988464, -0.09441932290792465, -0.06563444435596466, -0.036849573254585266, -0.008064702153205872, 0.020720183849334717, 0.04950505495071411, 0.0782899260520935, 0.1070747971534729, 0.1358596682548523, 0.16464455425739288, 0.19342942535877228, 0.22221429646015167, 0.25099918246269226, 0.27978405356407166, 0.30856892466545105, 0.33735379576683044, 0.36613866686820984, 0.3949235677719116, 0.423708438873291, 0.4524933099746704, 0.4812781810760498, 0.5100630521774292, 0.5388479232788086, 0.567632794380188, 0.5964176654815674, 0.6252025365829468, 0.6539874076843262, 0.6827722787857056, 0.711557149887085, 0.7403420209884644, 0.7691268920898438, 0.7979117631912231, 0.8266966342926025, 0.8554815053939819, 0.8842663764953613, 0.9130512475967407, 0.9418361186981201, 0.9706209897994995, 0.9994059205055237]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 17.0, 30.0, 45.0, 55.0, 76.0, 143.0, 225.0, 405.0, 660.0, 1075.0, 1864.0, 3419.0, 6358.0, 12090.0, 23906.0, 49893.0, 110366.0, 242432.0, 300603.0, 157497.0, 69962.0, 32661.0, 16078.0, 8386.0, 4567.0, 2396.0, 1345.0, 773.0, 456.0, 279.0, 173.0, 106.0, 74.0, 48.0, 20.0, 20.0, 8.0, 10.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3492279052734375, -0.335906982421875, -0.3225860595703125, -0.30926513671875, -0.2959442138671875, -0.282623291015625, -0.2693023681640625, -0.2559814453125, -0.2426605224609375, -0.229339599609375, -0.2160186767578125, -0.20269775390625, -0.1893768310546875, -0.176055908203125, -0.1627349853515625, -0.1494140625, -0.1360931396484375, -0.122772216796875, -0.1094512939453125, -0.09613037109375, -0.0828094482421875, -0.069488525390625, -0.0561676025390625, -0.0428466796875, -0.0295257568359375, -0.016204833984375, -0.0028839111328125, 0.01043701171875, 0.0237579345703125, 0.037078857421875, 0.0503997802734375, 0.063720703125, 0.0770416259765625, 0.090362548828125, 0.1036834716796875, 0.11700439453125, 0.1303253173828125, 0.143646240234375, 0.1569671630859375, 0.1702880859375, 0.1836090087890625, 0.196929931640625, 0.2102508544921875, 0.22357177734375, 0.2368927001953125, 0.250213623046875, 0.2635345458984375, 0.27685546875, 0.2901763916015625, 0.303497314453125, 0.3168182373046875, 0.33013916015625, 0.3434600830078125, 0.356781005859375, 0.3701019287109375, 0.3834228515625, 0.3967437744140625, 0.410064697265625, 0.4233856201171875, 0.43670654296875, 0.4500274658203125, 0.463348388671875, 0.4766693115234375, 0.489990234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 13.0, 14.0, 17.0, 17.0, 19.0, 25.0, 24.0, 38.0, 34.0, 50.0, 56.0, 38.0, 39.0, 51.0, 44.0, 60.0, 57.0, 47.0, 46.0, 38.0, 46.0, 37.0, 31.0, 26.0, 26.0, 20.0, 18.0, 19.0, 9.0, 12.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.5836029052734375, -0.561248779296875, -0.5388946533203125, -0.51654052734375, -0.4941864013671875, -0.471832275390625, -0.4494781494140625, -0.4271240234375, -0.4047698974609375, -0.382415771484375, -0.3600616455078125, -0.33770751953125, -0.3153533935546875, -0.292999267578125, -0.2706451416015625, -0.248291015625, -0.2259368896484375, -0.203582763671875, -0.1812286376953125, -0.15887451171875, -0.1365203857421875, -0.114166259765625, -0.0918121337890625, -0.0694580078125, -0.0471038818359375, -0.024749755859375, -0.0023956298828125, 0.01995849609375, 0.0423126220703125, 0.064666748046875, 0.0870208740234375, 0.109375, 0.1317291259765625, 0.154083251953125, 0.1764373779296875, 0.19879150390625, 0.2211456298828125, 0.243499755859375, 0.2658538818359375, 0.2882080078125, 0.3105621337890625, 0.332916259765625, 0.3552703857421875, 0.37762451171875, 0.3999786376953125, 0.422332763671875, 0.4446868896484375, 0.467041015625, 0.4893951416015625, 0.511749267578125, 0.5341033935546875, 0.55645751953125, 0.5788116455078125, 0.601165771484375, 0.6235198974609375, 0.6458740234375, 0.6682281494140625, 0.690582275390625, 0.7129364013671875, 0.73529052734375, 0.7576446533203125, 0.779998779296875, 0.8023529052734375, 0.82470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 14.0, 8.0, 12.0, 25.0, 24.0, 45.0, 83.0, 106.0, 185.0, 280.0, 490.0, 972.0, 1872.0, 4010.0, 9404.0, 23813.0, 66248.0, 188819.0, 373466.0, 240522.0, 85921.0, 30576.0, 11867.0, 4976.0, 2229.0, 1080.0, 581.0, 353.0, 205.0, 133.0, 85.0, 52.0, 31.0, 25.0, 15.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.54296875, -0.5281448364257812, -0.5133209228515625, -0.49849700927734375, -0.483673095703125, -0.46884918212890625, -0.4540252685546875, -0.43920135498046875, -0.42437744140625, -0.40955352783203125, -0.3947296142578125, -0.37990570068359375, -0.365081787109375, -0.35025787353515625, -0.3354339599609375, -0.32061004638671875, -0.3057861328125, -0.29096221923828125, -0.2761383056640625, -0.26131439208984375, -0.246490478515625, -0.23166656494140625, -0.2168426513671875, -0.20201873779296875, -0.18719482421875, -0.17237091064453125, -0.1575469970703125, -0.14272308349609375, -0.127899169921875, -0.11307525634765625, -0.0982513427734375, -0.08342742919921875, -0.068603515625, -0.05377960205078125, -0.0389556884765625, -0.02413177490234375, -0.009307861328125, 0.00551605224609375, 0.0203399658203125, 0.03516387939453125, 0.04998779296875, 0.06481170654296875, 0.0796356201171875, 0.09445953369140625, 0.109283447265625, 0.12410736083984375, 0.1389312744140625, 0.15375518798828125, 0.1685791015625, 0.18340301513671875, 0.1982269287109375, 0.21305084228515625, 0.227874755859375, 0.24269866943359375, 0.2575225830078125, 0.27234649658203125, 0.28717041015625, 0.30199432373046875, 0.3168182373046875, 0.33164215087890625, 0.346466064453125, 0.36128997802734375, 0.3761138916015625, 0.39093780517578125, 0.40576171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 13.0, 9.0, 11.0, 21.0, 30.0, 23.0, 31.0, 29.0, 25.0, 51.0, 36.0, 35.0, 50.0, 59.0, 55.0, 54.0, 45.0, 33.0, 42.0, 40.0, 39.0, 41.0, 48.0, 24.0, 20.0, 23.0, 18.0, 11.0, 17.0, 13.0, 10.0, 4.0, 8.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0533294677734375, -1.013885498046875, -0.9744415283203125, -0.93499755859375, -0.8955535888671875, -0.856109619140625, -0.8166656494140625, -0.7772216796875, -0.7377777099609375, -0.698333740234375, -0.6588897705078125, -0.61944580078125, -0.5800018310546875, -0.540557861328125, -0.5011138916015625, -0.461669921875, -0.4222259521484375, -0.382781982421875, -0.3433380126953125, -0.30389404296875, -0.2644500732421875, -0.225006103515625, -0.1855621337890625, -0.1461181640625, -0.1066741943359375, -0.067230224609375, -0.0277862548828125, 0.01165771484375, 0.0511016845703125, 0.090545654296875, 0.1299896240234375, 0.16943359375, 0.2088775634765625, 0.248321533203125, 0.2877655029296875, 0.32720947265625, 0.3666534423828125, 0.406097412109375, 0.4455413818359375, 0.4849853515625, 0.5244293212890625, 0.563873291015625, 0.6033172607421875, 0.64276123046875, 0.6822052001953125, 0.721649169921875, 0.7610931396484375, 0.800537109375, 0.8399810791015625, 0.879425048828125, 0.9188690185546875, 0.95831298828125, 0.9977569580078125, 1.037200927734375, 1.0766448974609375, 1.1160888671875, 1.1555328369140625, 1.194976806640625, 1.2344207763671875, 1.27386474609375, 1.3133087158203125, 1.352752685546875, 1.3921966552734375, 1.431640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 13.0, 10.0, 19.0, 11.0, 32.0, 35.0, 45.0, 99.0, 149.0, 253.0, 380.0, 588.0, 955.0, 1747.0, 3359.0, 6390.0, 13362.0, 30336.0, 73600.0, 174878.0, 313032.0, 240968.0, 107368.0, 43852.0, 18589.0, 8668.0, 4332.0, 2187.0, 1310.0, 730.0, 476.0, 284.0, 144.0, 91.0, 81.0, 55.0, 39.0, 28.0, 21.0, 11.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.0863037109375, -0.0838174819946289, -0.08133125305175781, -0.07884502410888672, -0.07635879516601562, -0.07387256622314453, -0.07138633728027344, -0.06890010833740234, -0.06641387939453125, -0.06392765045166016, -0.06144142150878906, -0.05895519256591797, -0.056468963623046875, -0.05398273468017578, -0.05149650573730469, -0.049010276794433594, -0.0465240478515625, -0.044037818908691406, -0.04155158996582031, -0.03906536102294922, -0.036579132080078125, -0.03409290313720703, -0.03160667419433594, -0.029120445251464844, -0.02663421630859375, -0.024147987365722656, -0.021661758422851562, -0.01917552947998047, -0.016689300537109375, -0.014203071594238281, -0.011716842651367188, -0.009230613708496094, -0.006744384765625, -0.004258155822753906, -0.0017719268798828125, 0.0007143020629882812, 0.003200531005859375, 0.005686759948730469, 0.008172988891601562, 0.010659217834472656, 0.01314544677734375, 0.015631675720214844, 0.018117904663085938, 0.02060413360595703, 0.023090362548828125, 0.02557659149169922, 0.028062820434570312, 0.030549049377441406, 0.0330352783203125, 0.035521507263183594, 0.03800773620605469, 0.04049396514892578, 0.042980194091796875, 0.04546642303466797, 0.04795265197753906, 0.050438880920410156, 0.05292510986328125, 0.055411338806152344, 0.05789756774902344, 0.06038379669189453, 0.06287002563476562, 0.06535625457763672, 0.06784248352050781, 0.0703287124633789, 0.07281494140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 18.0, 22.0, 40.0, 50.0, 64.0, 80.0, 98.0, 105.0, 95.0, 94.0, 70.0, 54.0, 40.0, 26.0, 34.0, 22.0, 10.0, 10.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.441375732421875e-05, -9.152665734291077e-05, -8.863955736160278e-05, -8.57524573802948e-05, -8.286535739898682e-05, -7.997825741767883e-05, -7.709115743637085e-05, -7.420405745506287e-05, -7.131695747375488e-05, -6.84298574924469e-05, -6.554275751113892e-05, -6.265565752983093e-05, -5.976855754852295e-05, -5.6881457567214966e-05, -5.399435758590698e-05, -5.1107257604599e-05, -4.8220157623291016e-05, -4.533305764198303e-05, -4.244595766067505e-05, -3.9558857679367065e-05, -3.667175769805908e-05, -3.37846577167511e-05, -3.0897557735443115e-05, -2.8010457754135132e-05, -2.512335777282715e-05, -2.2236257791519165e-05, -1.934915781021118e-05, -1.6462057828903198e-05, -1.3574957847595215e-05, -1.0687857866287231e-05, -7.800757884979248e-06, -4.913657903671265e-06, -2.0265579223632812e-06, 8.605420589447021e-07, 3.7476420402526855e-06, 6.634742021560669e-06, 9.521842002868652e-06, 1.2408941984176636e-05, 1.529604196548462e-05, 1.8183141946792603e-05, 2.1070241928100586e-05, 2.395734190940857e-05, 2.6844441890716553e-05, 2.9731541872024536e-05, 3.261864185333252e-05, 3.55057418346405e-05, 3.8392841815948486e-05, 4.127994179725647e-05, 4.416704177856445e-05, 4.7054141759872437e-05, 4.994124174118042e-05, 5.28283417224884e-05, 5.571544170379639e-05, 5.860254168510437e-05, 6.148964166641235e-05, 6.437674164772034e-05, 6.726384162902832e-05, 7.01509416103363e-05, 7.303804159164429e-05, 7.592514157295227e-05, 7.881224155426025e-05, 8.169934153556824e-05, 8.458644151687622e-05, 8.74735414981842e-05, 9.036064147949219e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 13.0, 27.0, 29.0, 32.0, 64.0, 98.0, 360.0, 4012.0, 312282.0, 720970.0, 9691.0, 556.0, 141.0, 71.0, 42.0, 40.0, 18.0, 18.0, 15.0, 14.0, 3.0, 4.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.40380859375, -0.3916168212890625, -0.379425048828125, -0.3672332763671875, -0.35504150390625, -0.3428497314453125, -0.330657958984375, -0.3184661865234375, -0.3062744140625, -0.2940826416015625, -0.281890869140625, -0.2696990966796875, -0.25750732421875, -0.2453155517578125, -0.233123779296875, -0.2209320068359375, -0.208740234375, -0.1965484619140625, -0.184356689453125, -0.1721649169921875, -0.15997314453125, -0.1477813720703125, -0.135589599609375, -0.1233978271484375, -0.1112060546875, -0.0990142822265625, -0.086822509765625, -0.0746307373046875, -0.06243896484375, -0.0502471923828125, -0.038055419921875, -0.0258636474609375, -0.013671875, -0.0014801025390625, 0.010711669921875, 0.0229034423828125, 0.03509521484375, 0.0472869873046875, 0.059478759765625, 0.0716705322265625, 0.0838623046875, 0.0960540771484375, 0.108245849609375, 0.1204376220703125, 0.13262939453125, 0.1448211669921875, 0.157012939453125, 0.1692047119140625, 0.181396484375, 0.1935882568359375, 0.205780029296875, 0.2179718017578125, 0.23016357421875, 0.2423553466796875, 0.254547119140625, 0.2667388916015625, 0.2789306640625, 0.2911224365234375, 0.303314208984375, 0.3155059814453125, 0.32769775390625, 0.3398895263671875, 0.352081298828125, 0.3642730712890625, 0.37646484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 7.0, 5.0, 9.0, 14.0, 19.0, 20.0, 19.0, 13.0, 26.0, 25.0, 39.0, 39.0, 30.0, 32.0, 40.0, 40.0, 48.0, 47.0, 57.0, 39.0, 39.0, 40.0, 42.0, 34.0, 33.0, 34.0, 25.0, 23.0, 18.0, 22.0, 18.0, 13.0, 15.0, 9.0, 7.0, 6.0, 7.0, 4.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205841064453125, -0.019893646240234375, -0.01920318603515625, -0.018512725830078125, -0.017822265625, -0.017131805419921875, -0.01644134521484375, -0.015750885009765625, -0.0150604248046875, -0.014369964599609375, -0.01367950439453125, -0.012989044189453125, -0.012298583984375, -0.011608123779296875, -0.01091766357421875, -0.010227203369140625, -0.0095367431640625, -0.008846282958984375, -0.00815582275390625, -0.007465362548828125, -0.00677490234375, -0.006084442138671875, -0.00539398193359375, -0.004703521728515625, -0.0040130615234375, -0.003322601318359375, -0.00263214111328125, -0.001941680908203125, -0.001251220703125, -0.000560760498046875, 0.00012969970703125, 0.000820159912109375, 0.0015106201171875, 0.002201080322265625, 0.00289154052734375, 0.003582000732421875, 0.0042724609375, 0.004962921142578125, 0.00565338134765625, 0.006343841552734375, 0.0070343017578125, 0.007724761962890625, 0.00841522216796875, 0.009105682373046875, 0.009796142578125, 0.010486602783203125, 0.01117706298828125, 0.011867523193359375, 0.0125579833984375, 0.013248443603515625, 0.01393890380859375, 0.014629364013671875, 0.01531982421875, 0.016010284423828125, 0.01670074462890625, 0.017391204833984375, 0.0180816650390625, 0.018772125244140625, 0.01946258544921875, 0.020153045654296875, 0.020843505859375, 0.021533966064453125, 0.02222442626953125, 0.022914886474609375, 0.0236053466796875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 19.0, 26.0, 34.0, 79.0, 98.0, 110.0, 145.0, 152.0, 103.0, 85.0, 56.0, 40.0, 21.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9421945214271545, -0.9026233553886414, -0.8630521297454834, -0.8234809637069702, -0.7839097380638123, -0.7443385720252991, -0.7047673463821411, -0.6651961803436279, -0.6256250143051147, -0.5860538482666016, -0.5464826226234436, -0.5069114565849304, -0.46734023094177246, -0.4277690649032593, -0.3881978690624237, -0.34862667322158813, -0.3090554475784302, -0.2694842517375946, -0.22991305589675903, -0.19034187495708466, -0.15077067911624908, -0.11119948327541351, -0.07162830233573914, -0.032057106494903564, 0.007514089345932007, 0.04708528146147728, 0.08665647357702255, 0.12622766196727753, 0.1657988578081131, 0.20537005364894867, 0.24494123458862305, 0.2845124304294586, 0.3240835666656494, 0.363654762506485, 0.40322595834732056, 0.44279712438583374, 0.4823683500289917, 0.5219395160675049, 0.5615106821060181, 0.601081907749176, 0.640653133392334, 0.6802242994308472, 0.7197955250740051, 0.7593666911125183, 0.7989379167556763, 0.8385090827941895, 0.8780802488327026, 0.9176514744758606, 0.9572226405143738, 0.996793806552887, 1.036365032196045, 1.075936198234558, 1.1155073642730713, 1.155078649520874, 1.1946498155593872, 1.2342209815979004, 1.2737921476364136, 1.3133633136749268, 1.35293447971344, 1.3925057649612427, 1.4320769309997559, 1.471648097038269, 1.5112192630767822, 1.550790548324585, 1.5903617143630981]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 5.0, 9.0, 19.0, 23.0, 17.0, 30.0, 22.0, 36.0, 28.0, 37.0, 44.0, 43.0, 45.0, 38.0, 58.0, 37.0, 50.0, 65.0, 50.0, 45.0, 39.0, 32.0, 41.0, 34.0, 21.0, 26.0, 18.0, 15.0, 10.0, 7.0, 7.0, 12.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6159753203392029, -0.5949367880821228, -0.5738983154296875, -0.5528597831726074, -0.5318212509155273, -0.5107827186584473, -0.48974424600601196, -0.4687057137489319, -0.4476671814918518, -0.4266286790370941, -0.40559014678001404, -0.38455164432525635, -0.36351311206817627, -0.3424746096134186, -0.3214361071586609, -0.3003975749015808, -0.2793590724468231, -0.25832056999206543, -0.23728203773498535, -0.21624353528022766, -0.19520500302314758, -0.1741665005683899, -0.153127983212471, -0.13208946585655212, -0.11105094850063324, -0.09001243114471436, -0.06897391378879547, -0.047935403883457184, -0.0268968865275383, -0.005858369171619415, 0.015180140733718872, 0.036218658089637756, 0.05725717544555664, 0.07829569280147552, 0.09933421015739441, 0.1203727200627327, 0.14141124486923218, 0.16244974732398987, 0.18348826467990875, 0.20452678203582764, 0.22556529939174652, 0.2466038167476654, 0.2676423192024231, 0.2886808514595032, 0.30971935391426086, 0.33075788617134094, 0.35179638862609863, 0.3728349208831787, 0.3938734233379364, 0.4149119257926941, 0.43595045804977417, 0.45698896050453186, 0.47802749276161194, 0.49906599521636963, 0.5201045274734497, 0.5411430597305298, 0.5621815323829651, 0.5832200646400452, 0.6042585372924805, 0.6252970695495605, 0.6463356018066406, 0.6673741340637207, 0.688412606716156, 0.7094511389732361, 0.7304896712303162]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 12.0, 17.0, 20.0, 12.0, 26.0, 55.0, 69.0, 78.0, 99.0, 164.0, 245.0, 401.0, 648.0, 1058.0, 1854.0, 3333.0, 6735.0, 14911.0, 40206.0, 148845.0, 541373.0, 203766.0, 49653.0, 18109.0, 7821.0, 3838.0, 2069.0, 1147.0, 632.0, 479.0, 239.0, 204.0, 122.0, 81.0, 55.0, 37.0, 26.0, 25.0, 17.0, 13.0, 11.0, 9.0, 5.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5546875, -0.5371322631835938, -0.5195770263671875, -0.5020217895507812, -0.484466552734375, -0.46691131591796875, -0.4493560791015625, -0.43180084228515625, -0.41424560546875, -0.39669036865234375, -0.3791351318359375, -0.36157989501953125, -0.344024658203125, -0.32646942138671875, -0.3089141845703125, -0.29135894775390625, -0.2738037109375, -0.25624847412109375, -0.2386932373046875, -0.22113800048828125, -0.203582763671875, -0.18602752685546875, -0.1684722900390625, -0.15091705322265625, -0.13336181640625, -0.11580657958984375, -0.0982513427734375, -0.08069610595703125, -0.063140869140625, -0.04558563232421875, -0.0280303955078125, -0.01047515869140625, 0.007080078125, 0.02463531494140625, 0.0421905517578125, 0.05974578857421875, 0.077301025390625, 0.09485626220703125, 0.1124114990234375, 0.12996673583984375, 0.14752197265625, 0.16507720947265625, 0.1826324462890625, 0.20018768310546875, 0.217742919921875, 0.23529815673828125, 0.2528533935546875, 0.27040863037109375, 0.2879638671875, 0.30551910400390625, 0.3230743408203125, 0.34062957763671875, 0.358184814453125, 0.37574005126953125, 0.3932952880859375, 0.41085052490234375, 0.42840576171875, 0.44596099853515625, 0.4635162353515625, 0.48107147216796875, 0.498626708984375, 0.5161819458007812, 0.5337371826171875, 0.5512924194335938, 0.56884765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 16.0, 12.0, 13.0, 13.0, 22.0, 8.0, 29.0, 25.0, 25.0, 32.0, 34.0, 36.0, 37.0, 35.0, 55.0, 38.0, 43.0, 54.0, 57.0, 47.0, 49.0, 40.0, 45.0, 34.0, 32.0, 32.0, 26.0, 23.0, 12.0, 13.0, 20.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.762969970703125, -1.70660400390625, -1.650238037109375, -1.5938720703125, -1.537506103515625, -1.48114013671875, -1.424774169921875, -1.368408203125, -1.312042236328125, -1.25567626953125, -1.199310302734375, -1.1429443359375, -1.086578369140625, -1.03021240234375, -0.973846435546875, -0.91748046875, -0.861114501953125, -0.80474853515625, -0.748382568359375, -0.6920166015625, -0.635650634765625, -0.57928466796875, -0.522918701171875, -0.466552734375, -0.410186767578125, -0.35382080078125, -0.297454833984375, -0.2410888671875, -0.184722900390625, -0.12835693359375, -0.071990966796875, -0.015625, 0.040740966796875, 0.09710693359375, 0.153472900390625, 0.2098388671875, 0.266204833984375, 0.32257080078125, 0.378936767578125, 0.435302734375, 0.491668701171875, 0.54803466796875, 0.604400634765625, 0.6607666015625, 0.717132568359375, 0.77349853515625, 0.829864501953125, 0.88623046875, 0.942596435546875, 0.99896240234375, 1.055328369140625, 1.1116943359375, 1.168060302734375, 1.22442626953125, 1.280792236328125, 1.337158203125, 1.393524169921875, 1.44989013671875, 1.506256103515625, 1.5626220703125, 1.618988037109375, 1.67535400390625, 1.731719970703125, 1.7880859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 16.0, 17.0, 24.0, 25.0, 30.0, 48.0, 77.0, 67.0, 99.0, 223.0, 3021.0, 1043090.0, 1194.0, 177.0, 103.0, 77.0, 53.0, 51.0, 39.0, 21.0, 19.0, 16.0, 13.0, 9.0, 7.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.228515625, -7.99609375, -7.763671875, -7.53125, -7.298828125, -7.06640625, -6.833984375, -6.6015625, -6.369140625, -6.13671875, -5.904296875, -5.671875, -5.439453125, -5.20703125, -4.974609375, -4.7421875, -4.509765625, -4.27734375, -4.044921875, -3.8125, -3.580078125, -3.34765625, -3.115234375, -2.8828125, -2.650390625, -2.41796875, -2.185546875, -1.953125, -1.720703125, -1.48828125, -1.255859375, -1.0234375, -0.791015625, -0.55859375, -0.326171875, -0.09375, 0.138671875, 0.37109375, 0.603515625, 0.8359375, 1.068359375, 1.30078125, 1.533203125, 1.765625, 1.998046875, 2.23046875, 2.462890625, 2.6953125, 2.927734375, 3.16015625, 3.392578125, 3.625, 3.857421875, 4.08984375, 4.322265625, 4.5546875, 4.787109375, 5.01953125, 5.251953125, 5.484375, 5.716796875, 5.94921875, 6.181640625, 6.4140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 14.0, 18.0, 21.0, 25.0, 30.0, 35.0, 55.0, 46.0, 53.0, 67.0, 70.0, 58.0, 72.0, 74.0, 67.0, 54.0, 41.0, 42.0, 25.0, 30.0, 19.0, 16.0, 10.0, 10.0, 7.0, 7.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.322265625, -3.23101806640625, -3.1397705078125, -3.04852294921875, -2.957275390625, -2.86602783203125, -2.7747802734375, -2.68353271484375, -2.59228515625, -2.50103759765625, -2.4097900390625, -2.31854248046875, -2.227294921875, -2.13604736328125, -2.0447998046875, -1.95355224609375, -1.8623046875, -1.77105712890625, -1.6798095703125, -1.58856201171875, -1.497314453125, -1.40606689453125, -1.3148193359375, -1.22357177734375, -1.13232421875, -1.04107666015625, -0.9498291015625, -0.85858154296875, -0.767333984375, -0.67608642578125, -0.5848388671875, -0.49359130859375, -0.40234375, -0.31109619140625, -0.2198486328125, -0.12860107421875, -0.037353515625, 0.05389404296875, 0.1451416015625, 0.23638916015625, 0.32763671875, 0.41888427734375, 0.5101318359375, 0.60137939453125, 0.692626953125, 0.78387451171875, 0.8751220703125, 0.96636962890625, 1.0576171875, 1.14886474609375, 1.2401123046875, 1.33135986328125, 1.422607421875, 1.51385498046875, 1.6051025390625, 1.69635009765625, 1.78759765625, 1.87884521484375, 1.9700927734375, 2.06134033203125, 2.152587890625, 2.24383544921875, 2.3350830078125, 2.42633056640625, 2.517578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 9.0, 11.0, 18.0, 38.0, 93.0, 370.0, 4585.0, 1012531.0, 29838.0, 745.0, 150.0, 61.0, 35.0, 15.0, 17.0, 9.0, 3.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4306640625, -1.380828857421875, -1.33099365234375, -1.281158447265625, -1.2313232421875, -1.181488037109375, -1.13165283203125, -1.081817626953125, -1.031982421875, -0.982147216796875, -0.93231201171875, -0.882476806640625, -0.8326416015625, -0.782806396484375, -0.73297119140625, -0.683135986328125, -0.63330078125, -0.583465576171875, -0.53363037109375, -0.483795166015625, -0.4339599609375, -0.384124755859375, -0.33428955078125, -0.284454345703125, -0.234619140625, -0.184783935546875, -0.13494873046875, -0.085113525390625, -0.0352783203125, 0.014556884765625, 0.06439208984375, 0.114227294921875, 0.1640625, 0.213897705078125, 0.26373291015625, 0.313568115234375, 0.3634033203125, 0.413238525390625, 0.46307373046875, 0.512908935546875, 0.562744140625, 0.612579345703125, 0.66241455078125, 0.712249755859375, 0.7620849609375, 0.811920166015625, 0.86175537109375, 0.911590576171875, 0.96142578125, 1.011260986328125, 1.06109619140625, 1.110931396484375, 1.1607666015625, 1.210601806640625, 1.26043701171875, 1.310272216796875, 1.360107421875, 1.409942626953125, 1.45977783203125, 1.509613037109375, 1.5594482421875, 1.609283447265625, 1.65911865234375, 1.708953857421875, 1.7587890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 14.0, 17.0, 39.0, 50.0, 84.0, 166.0, 247.0, 137.0, 93.0, 36.0, 20.0, 25.0, 23.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.113550186157227e-05, -8.908286690711975e-05, -8.703023195266724e-05, -8.497759699821472e-05, -8.292496204376221e-05, -8.087232708930969e-05, -7.881969213485718e-05, -7.676705718040466e-05, -7.471442222595215e-05, -7.266178727149963e-05, -7.060915231704712e-05, -6.85565173625946e-05, -6.650388240814209e-05, -6.445124745368958e-05, -6.239861249923706e-05, -6.0345977544784546e-05, -5.829334259033203e-05, -5.6240707635879517e-05, -5.4188072681427e-05, -5.213543772697449e-05, -5.008280277252197e-05, -4.803016781806946e-05, -4.597753286361694e-05, -4.392489790916443e-05, -4.1872262954711914e-05, -3.98196280002594e-05, -3.7766993045806885e-05, -3.571435809135437e-05, -3.3661723136901855e-05, -3.160908818244934e-05, -2.9556453227996826e-05, -2.750381827354431e-05, -2.5451183319091797e-05, -2.3398548364639282e-05, -2.1345913410186768e-05, -1.9293278455734253e-05, -1.7240643501281738e-05, -1.5188008546829224e-05, -1.3135373592376709e-05, -1.1082738637924194e-05, -9.03010368347168e-06, -6.977468729019165e-06, -4.92483377456665e-06, -2.8721988201141357e-06, -8.195638656616211e-07, 1.2330710887908936e-06, 3.285706043243408e-06, 5.338340997695923e-06, 7.3909759521484375e-06, 9.443610906600952e-06, 1.1496245861053467e-05, 1.3548880815505981e-05, 1.5601515769958496e-05, 1.765415072441101e-05, 1.9706785678863525e-05, 2.175942063331604e-05, 2.3812055587768555e-05, 2.586469054222107e-05, 2.7917325496673584e-05, 2.99699604511261e-05, 3.202259540557861e-05, 3.407523036003113e-05, 3.612786531448364e-05, 3.818050026893616e-05, 4.023313522338867e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 13.0, 18.0, 23.0, 38.0, 74.0, 205.0, 932.0, 18461.0, 1008751.0, 18538.0, 1070.0, 231.0, 69.0, 39.0, 22.0, 15.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.47265625, -1.4371719360351562, -1.4016876220703125, -1.3662033081054688, -1.330718994140625, -1.2952346801757812, -1.2597503662109375, -1.2242660522460938, -1.18878173828125, -1.1532974243164062, -1.1178131103515625, -1.0823287963867188, -1.046844482421875, -1.0113601684570312, -0.9758758544921875, -0.9403915405273438, -0.9049072265625, -0.8694229125976562, -0.8339385986328125, -0.7984542846679688, -0.762969970703125, -0.7274856567382812, -0.6920013427734375, -0.6565170288085938, -0.62103271484375, -0.5855484008789062, -0.5500640869140625, -0.5145797729492188, -0.479095458984375, -0.44361114501953125, -0.4081268310546875, -0.37264251708984375, -0.337158203125, -0.30167388916015625, -0.2661895751953125, -0.23070526123046875, -0.195220947265625, -0.15973663330078125, -0.1242523193359375, -0.08876800537109375, -0.05328369140625, -0.01779937744140625, 0.0176849365234375, 0.05316925048828125, 0.088653564453125, 0.12413787841796875, 0.1596221923828125, 0.19510650634765625, 0.2305908203125, 0.26607513427734375, 0.3015594482421875, 0.33704376220703125, 0.372528076171875, 0.40801239013671875, 0.4434967041015625, 0.47898101806640625, 0.51446533203125, 0.5499496459960938, 0.5854339599609375, 0.6209182739257812, 0.656402587890625, 0.6918869018554688, 0.7273712158203125, 0.7628555297851562, 0.79833984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 11.0, 17.0, 16.0, 48.0, 60.0, 83.0, 169.0, 224.0, 118.0, 75.0, 37.0, 30.0, 25.0, 13.0, 16.0, 10.0, 6.0, 5.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1075439453125, -0.10291671752929688, -0.09828948974609375, -0.09366226196289062, -0.0890350341796875, -0.08440780639648438, -0.07978057861328125, -0.07515335083007812, -0.070526123046875, -0.06589889526367188, -0.06127166748046875, -0.056644439697265625, -0.0520172119140625, -0.047389984130859375, -0.04276275634765625, -0.038135528564453125, -0.03350830078125, -0.028881072998046875, -0.02425384521484375, -0.019626617431640625, -0.0149993896484375, -0.010372161865234375, -0.00574493408203125, -0.001117706298828125, 0.003509521484375, 0.008136749267578125, 0.01276397705078125, 0.017391204833984375, 0.0220184326171875, 0.026645660400390625, 0.03127288818359375, 0.035900115966796875, 0.04052734375, 0.045154571533203125, 0.04978179931640625, 0.054409027099609375, 0.0590362548828125, 0.06366348266601562, 0.06829071044921875, 0.07291793823242188, 0.077545166015625, 0.08217239379882812, 0.08679962158203125, 0.09142684936523438, 0.0960540771484375, 0.10068130493164062, 0.10530853271484375, 0.10993576049804688, 0.11456298828125, 0.11919021606445312, 0.12381744384765625, 0.12844467163085938, 0.1330718994140625, 0.13769912719726562, 0.14232635498046875, 0.14695358276367188, 0.151580810546875, 0.15620803833007812, 0.16083526611328125, 0.16546249389648438, 0.1700897216796875, 0.17471694946289062, 0.17934417724609375, 0.18397140502929688, 0.1885986328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 63.0, 460.0, 441.0, 46.0, 3.0, 1.0], "bins": [-21.95492935180664, -21.588531494140625, -21.22213363647461, -20.855735778808594, -20.489337921142578, -20.122940063476562, -19.756542205810547, -19.39014434814453, -19.023746490478516, -18.6573486328125, -18.290950775146484, -17.92455291748047, -17.558155059814453, -17.191757202148438, -16.825359344482422, -16.458961486816406, -16.092565536499023, -15.726167678833008, -15.359769821166992, -14.993371963500977, -14.626974105834961, -14.260577201843262, -13.894179344177246, -13.52778148651123, -13.161383628845215, -12.7949857711792, -12.428587913513184, -12.062190055847168, -11.695793151855469, -11.329395294189453, -10.962997436523438, -10.596599578857422, -10.230201721191406, -9.86380386352539, -9.497406005859375, -9.13100814819336, -8.764610290527344, -8.398213386535645, -8.031815528869629, -7.665417671203613, -7.299019813537598, -6.932621955871582, -6.566224098205566, -6.199826717376709, -5.833428859710693, -5.467031002044678, -5.10063362121582, -4.734235763549805, -4.367837905883789, -4.001440048217773, -3.635042428970337, -3.2686448097229004, -2.9022469520568848, -2.535849094390869, -2.1694514751434326, -1.803053855895996, -1.4366559982299805, -1.0702582597732544, -0.7038605213165283, -0.33746278285980225, 0.028934955596923828, 0.3953326940536499, 0.761730432510376, 1.1281280517578125, 1.4945259094238281]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 8.0, 12.0, 10.0, 12.0, 17.0, 21.0, 20.0, 26.0, 27.0, 20.0, 36.0, 42.0, 40.0, 35.0, 44.0, 49.0, 50.0, 42.0, 45.0, 46.0, 52.0, 35.0, 43.0, 34.0, 42.0, 37.0, 22.0, 25.0, 12.0, 21.0, 16.0, 9.0, 7.0, 5.0, 6.0, 8.0, 5.0, 6.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.004420280456543, -2.91115140914917, -2.817882776260376, -2.724614143371582, -2.631345272064209, -2.538076400756836, -2.444807767868042, -2.351539134979248, -2.258270263671875, -2.165001392364502, -2.071732759475708, -1.9784640073776245, -1.885195255279541, -1.7919265031814575, -1.698657751083374, -1.6053889989852905, -1.512120246887207, -1.4188514947891235, -1.32558274269104, -1.2323139905929565, -1.139045238494873, -1.0457764863967896, -0.952507734298706, -0.8592389822006226, -0.7659702301025391, -0.6727014780044556, -0.5794327259063721, -0.4861639738082886, -0.3928952217102051, -0.2996264696121216, -0.20635771751403809, -0.11308896541595459, -0.019820451736450195, 0.0734483003616333, 0.1667170524597168, 0.2599858045578003, 0.3532545566558838, 0.4465233087539673, 0.5397920608520508, 0.6330608129501343, 0.7263295650482178, 0.8195983171463013, 0.9128670692443848, 1.0061358213424683, 1.0994045734405518, 1.1926733255386353, 1.2859420776367188, 1.3792108297348022, 1.4724795818328857, 1.5657483339309692, 1.6590170860290527, 1.7522858381271362, 1.8455545902252197, 1.9388233423233032, 2.0320920944213867, 2.1253609657287598, 2.2186295986175537, 2.3118982315063477, 2.4051671028137207, 2.4984359741210938, 2.5917046070098877, 2.6849732398986816, 2.7782421112060547, 2.8715109825134277, 2.9647796154022217]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 8.0, 6.0, 17.0, 13.0, 14.0, 14.0, 21.0, 25.0, 24.0, 26.0, 23.0, 33.0, 50.0, 106.0, 355.0, 1991.0, 23901.0, 2346223.0, 1798905.0, 20144.0, 1698.0, 294.0, 86.0, 57.0, 41.0, 34.0, 22.0, 22.0, 20.0, 23.0, 12.0, 15.0, 10.0, 10.0, 5.0, 8.0, 4.0, 0.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.680877685546875, -2.58831787109375, -2.495758056640625, -2.4031982421875, -2.310638427734375, -2.21807861328125, -2.125518798828125, -2.032958984375, -1.940399169921875, -1.84783935546875, -1.755279541015625, -1.6627197265625, -1.570159912109375, -1.47760009765625, -1.385040283203125, -1.29248046875, -1.199920654296875, -1.10736083984375, -1.014801025390625, -0.9222412109375, -0.829681396484375, -0.73712158203125, -0.644561767578125, -0.552001953125, -0.459442138671875, -0.36688232421875, -0.274322509765625, -0.1817626953125, -0.089202880859375, 0.00335693359375, 0.095916748046875, 0.1884765625, 0.281036376953125, 0.37359619140625, 0.466156005859375, 0.5587158203125, 0.651275634765625, 0.74383544921875, 0.836395263671875, 0.928955078125, 1.021514892578125, 1.11407470703125, 1.206634521484375, 1.2991943359375, 1.391754150390625, 1.48431396484375, 1.576873779296875, 1.66943359375, 1.761993408203125, 1.85455322265625, 1.947113037109375, 2.0396728515625, 2.132232666015625, 2.22479248046875, 2.317352294921875, 2.409912109375, 2.502471923828125, 2.59503173828125, 2.687591552734375, 2.7801513671875, 2.872711181640625, 2.96527099609375, 3.057830810546875, 3.150390625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 14.0, 8.0, 14.0, 13.0, 16.0, 24.0, 27.0, 28.0, 34.0, 40.0, 41.0, 37.0, 50.0, 51.0, 50.0, 45.0, 60.0, 51.0, 48.0, 43.0, 53.0, 35.0, 40.0, 33.0, 25.0, 24.0, 17.0, 16.0, 13.0, 8.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74365234375, -0.7209320068359375, -0.698211669921875, -0.6754913330078125, -0.65277099609375, -0.6300506591796875, -0.607330322265625, -0.5846099853515625, -0.5618896484375, -0.5391693115234375, -0.516448974609375, -0.4937286376953125, -0.47100830078125, -0.4482879638671875, -0.425567626953125, -0.4028472900390625, -0.380126953125, -0.3574066162109375, -0.334686279296875, -0.3119659423828125, -0.28924560546875, -0.2665252685546875, -0.243804931640625, -0.2210845947265625, -0.1983642578125, -0.1756439208984375, -0.152923583984375, -0.1302032470703125, -0.10748291015625, -0.0847625732421875, -0.062042236328125, -0.0393218994140625, -0.0166015625, 0.0061187744140625, 0.028839111328125, 0.0515594482421875, 0.07427978515625, 0.0970001220703125, 0.119720458984375, 0.1424407958984375, 0.1651611328125, 0.1878814697265625, 0.210601806640625, 0.2333221435546875, 0.25604248046875, 0.2787628173828125, 0.301483154296875, 0.3242034912109375, 0.346923828125, 0.3696441650390625, 0.392364501953125, 0.4150848388671875, 0.43780517578125, 0.4605255126953125, 0.483245849609375, 0.5059661865234375, 0.5286865234375, 0.5514068603515625, 0.574127197265625, 0.5968475341796875, 0.61956787109375, 0.6422882080078125, 0.665008544921875, 0.6877288818359375, 0.71044921875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 14.0, 14.0, 37.0, 52.0, 100.0, 189.0, 373.0, 1424.0, 1751784.0, 2437976.0, 1413.0, 413.0, 190.0, 112.0, 72.0, 29.0, 19.0, 14.0, 17.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.5, -7.241455078125, -6.98291015625, -6.724365234375, -6.4658203125, -6.207275390625, -5.94873046875, -5.690185546875, -5.431640625, -5.173095703125, -4.91455078125, -4.656005859375, -4.3974609375, -4.138916015625, -3.88037109375, -3.621826171875, -3.36328125, -3.104736328125, -2.84619140625, -2.587646484375, -2.3291015625, -2.070556640625, -1.81201171875, -1.553466796875, -1.294921875, -1.036376953125, -0.77783203125, -0.519287109375, -0.2607421875, -0.002197265625, 0.25634765625, 0.514892578125, 0.7734375, 1.031982421875, 1.29052734375, 1.549072265625, 1.8076171875, 2.066162109375, 2.32470703125, 2.583251953125, 2.841796875, 3.100341796875, 3.35888671875, 3.617431640625, 3.8759765625, 4.134521484375, 4.39306640625, 4.651611328125, 4.91015625, 5.168701171875, 5.42724609375, 5.685791015625, 5.9443359375, 6.202880859375, 6.46142578125, 6.719970703125, 6.978515625, 7.237060546875, 7.49560546875, 7.754150390625, 8.0126953125, 8.271240234375, 8.52978515625, 8.788330078125, 9.046875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 9.0, 20.0, 15.0, 22.0, 42.0, 78.0, 116.0, 206.0, 419.0, 740.0, 979.0, 635.0, 338.0, 185.0, 100.0, 54.0, 42.0, 19.0, 15.0, 5.0, 8.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5556640625, -0.5385055541992188, -0.5213470458984375, -0.5041885375976562, -0.487030029296875, -0.46987152099609375, -0.4527130126953125, -0.43555450439453125, -0.41839599609375, -0.40123748779296875, -0.3840789794921875, -0.36692047119140625, -0.349761962890625, -0.33260345458984375, -0.3154449462890625, -0.29828643798828125, -0.2811279296875, -0.26396942138671875, -0.2468109130859375, -0.22965240478515625, -0.212493896484375, -0.19533538818359375, -0.1781768798828125, -0.16101837158203125, -0.14385986328125, -0.12670135498046875, -0.1095428466796875, -0.09238433837890625, -0.075225830078125, -0.05806732177734375, -0.0409088134765625, -0.02375030517578125, -0.006591796875, 0.01056671142578125, 0.0277252197265625, 0.04488372802734375, 0.062042236328125, 0.07920074462890625, 0.0963592529296875, 0.11351776123046875, 0.13067626953125, 0.14783477783203125, 0.1649932861328125, 0.18215179443359375, 0.199310302734375, 0.21646881103515625, 0.2336273193359375, 0.25078582763671875, 0.2679443359375, 0.28510284423828125, 0.3022613525390625, 0.31941986083984375, 0.336578369140625, 0.35373687744140625, 0.3708953857421875, 0.38805389404296875, 0.40521240234375, 0.42237091064453125, 0.4395294189453125, 0.45668792724609375, 0.473846435546875, 0.49100494384765625, 0.5081634521484375, 0.5253219604492188, 0.54248046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 22.0, 15.0, 10.0, 35.0, 35.0, 36.0, 49.0, 56.0, 77.0, 69.0, 67.0, 82.0, 70.0, 53.0, 54.0, 54.0, 32.0, 30.0, 27.0, 21.0, 17.0, 9.0, 10.0, 13.0, 6.0, 1.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9879431128501892, -0.9588159918785095, -0.9296888113021851, -0.9005616903305054, -0.8714345693588257, -0.842307448387146, -0.8131802678108215, -0.7840531468391418, -0.7549259662628174, -0.7257988452911377, -0.6966716647148132, -0.6675445437431335, -0.6384174227714539, -0.6092902421951294, -0.5801631212234497, -0.55103600025177, -0.5219088792800903, -0.49278172850608826, -0.46365460753440857, -0.4345274567604065, -0.4054003357887268, -0.37627318501472473, -0.34714603424072266, -0.31801891326904297, -0.2888917624950409, -0.2597646117210388, -0.23063749074935913, -0.20151033997535706, -0.17238320410251617, -0.1432560682296753, -0.11412891745567322, -0.08500178158283234, -0.05587470531463623, -0.02674756571650505, 0.002379573881626129, 0.03150671720504761, 0.06063385307788849, 0.08976098895072937, 0.11888813972473145, 0.14801527559757233, 0.1771424114704132, 0.2062695473432541, 0.23539668321609497, 0.26452383399009705, 0.2936509847640991, 0.3227781057357788, 0.3519052565097809, 0.38103240728378296, 0.41015952825546265, 0.4392866790294647, 0.4684138000011444, 0.4975409507751465, 0.5266680717468262, 0.5557951927185059, 0.5849223732948303, 0.61404949426651, 0.6431766748428345, 0.6723037958145142, 0.7014309763908386, 0.7305580973625183, 0.759685218334198, 0.7888123989105225, 0.8179395198822021, 0.8470666408538818, 0.8761937618255615]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 7.0, 14.0, 19.0, 20.0, 12.0, 24.0, 23.0, 16.0, 33.0, 29.0, 36.0, 45.0, 33.0, 30.0, 42.0, 41.0, 52.0, 46.0, 36.0, 36.0, 40.0, 37.0, 38.0, 34.0, 29.0, 25.0, 30.0, 21.0, 28.0, 20.0, 15.0, 18.0, 12.0, 13.0, 7.0, 3.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6997560262680054, -0.6777433753013611, -0.655730664730072, -0.6337180137634277, -0.6117053031921387, -0.5896926522254944, -0.5676800012588501, -0.545667290687561, -0.523654580116272, -0.5016419291496277, -0.4796292185783386, -0.45761656761169434, -0.4356038570404053, -0.413591206073761, -0.3915785253047943, -0.36956584453582764, -0.34755319356918335, -0.3255405128002167, -0.30352783203125, -0.2815151810646057, -0.25950247049331665, -0.23748980462551117, -0.2154771387577057, -0.193464457988739, -0.17145177721977234, -0.14943909645080566, -0.127426415681839, -0.10541374981403351, -0.08340106904506683, -0.06138838827610016, -0.03937572240829468, -0.017363041639328003, 0.0046495795249938965, 0.026662256568670273, 0.04867493361234665, 0.07068760693073273, 0.0927002876996994, 0.11471296846866608, 0.13672563433647156, 0.15873831510543823, 0.1807509958744049, 0.20276367664337158, 0.22477635741233826, 0.24678902328014374, 0.2688016891479492, 0.2908143997192383, 0.31282705068588257, 0.33483973145484924, 0.3568524122238159, 0.3788650929927826, 0.40087777376174927, 0.42289042472839355, 0.4449031352996826, 0.4669157862663269, 0.4889284670352936, 0.5109411478042603, 0.5329538583755493, 0.5549665093421936, 0.5769792199134827, 0.598991870880127, 0.621004581451416, 0.6430172324180603, 0.6650298833847046, 0.6870425939559937, 0.7090552449226379]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 8.0, 10.0, 15.0, 21.0, 35.0, 41.0, 76.0, 122.0, 205.0, 376.0, 804.0, 1462.0, 3225.0, 6902.0, 15143.0, 38639.0, 123677.0, 442241.0, 293221.0, 74988.0, 26281.0, 11143.0, 5072.0, 2332.0, 1169.0, 569.0, 300.0, 162.0, 102.0, 62.0, 45.0, 20.0, 22.0, 11.0, 6.0, 9.0, 8.0, 4.0, 5.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.477294921875, -0.4635810852050781, -0.44986724853515625, -0.4361534118652344, -0.4224395751953125, -0.4087257385253906, -0.39501190185546875, -0.3812980651855469, -0.367584228515625, -0.3538703918457031, -0.34015655517578125, -0.3264427185058594, -0.3127288818359375, -0.2990150451660156, -0.28530120849609375, -0.2715873718261719, -0.25787353515625, -0.24415969848632812, -0.23044586181640625, -0.21673202514648438, -0.2030181884765625, -0.18930435180664062, -0.17559051513671875, -0.16187667846679688, -0.148162841796875, -0.13444900512695312, -0.12073516845703125, -0.10702133178710938, -0.0933074951171875, -0.07959365844726562, -0.06587982177734375, -0.052165985107421875, -0.0384521484375, -0.024738311767578125, -0.01102447509765625, 0.002689361572265625, 0.0164031982421875, 0.030117034912109375, 0.04383087158203125, 0.057544708251953125, 0.071258544921875, 0.08497238159179688, 0.09868621826171875, 0.11240005493164062, 0.1261138916015625, 0.13982772827148438, 0.15354156494140625, 0.16725540161132812, 0.18096923828125, 0.19468307495117188, 0.20839691162109375, 0.22211074829101562, 0.2358245849609375, 0.24953842163085938, 0.26325225830078125, 0.2769660949707031, 0.290679931640625, 0.3043937683105469, 0.31810760498046875, 0.3318214416503906, 0.3455352783203125, 0.3592491149902344, 0.37296295166015625, 0.3866767883300781, 0.400390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 12.0, 13.0, 21.0, 26.0, 26.0, 26.0, 30.0, 33.0, 38.0, 43.0, 40.0, 46.0, 50.0, 45.0, 41.0, 48.0, 49.0, 39.0, 48.0, 39.0, 48.0, 41.0, 26.0, 26.0, 20.0, 18.0, 19.0, 8.0, 19.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.42089080810546875, -0.4062347412109375, -0.39157867431640625, -0.376922607421875, -0.36226654052734375, -0.3476104736328125, -0.33295440673828125, -0.31829833984375, -0.30364227294921875, -0.2889862060546875, -0.27433013916015625, -0.259674072265625, -0.24501800537109375, -0.2303619384765625, -0.21570587158203125, -0.2010498046875, -0.18639373779296875, -0.1717376708984375, -0.15708160400390625, -0.142425537109375, -0.12776947021484375, -0.1131134033203125, -0.09845733642578125, -0.08380126953125, -0.06914520263671875, -0.0544891357421875, -0.03983306884765625, -0.025177001953125, -0.01052093505859375, 0.0041351318359375, 0.01879119873046875, 0.033447265625, 0.04810333251953125, 0.0627593994140625, 0.07741546630859375, 0.092071533203125, 0.10672760009765625, 0.1213836669921875, 0.13603973388671875, 0.15069580078125, 0.16535186767578125, 0.1800079345703125, 0.19466400146484375, 0.209320068359375, 0.22397613525390625, 0.2386322021484375, 0.25328826904296875, 0.2679443359375, 0.28260040283203125, 0.2972564697265625, 0.31191253662109375, 0.326568603515625, 0.34122467041015625, 0.3558807373046875, 0.37053680419921875, 0.38519287109375, 0.39984893798828125, 0.4145050048828125, 0.42916107177734375, 0.443817138671875, 0.45847320556640625, 0.4731292724609375, 0.48778533935546875, 0.50244140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 13.0, 14.0, 22.0, 24.0, 43.0, 66.0, 102.0, 120.0, 205.0, 309.0, 484.0, 849.0, 1423.0, 2479.0, 4573.0, 8801.0, 17623.0, 37446.0, 88961.0, 222174.0, 339829.0, 185494.0, 73340.0, 32065.0, 14990.0, 7583.0, 3996.0, 2187.0, 1281.0, 738.0, 472.0, 277.0, 182.0, 117.0, 87.0, 64.0, 27.0, 25.0, 20.0, 13.0, 10.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.26318359375, -0.2557487487792969, -0.24831390380859375, -0.24087905883789062, -0.2334442138671875, -0.22600936889648438, -0.21857452392578125, -0.21113967895507812, -0.203704833984375, -0.19626998901367188, -0.18883514404296875, -0.18140029907226562, -0.1739654541015625, -0.16653060913085938, -0.15909576416015625, -0.15166091918945312, -0.14422607421875, -0.13679122924804688, -0.12935638427734375, -0.12192153930664062, -0.1144866943359375, -0.10705184936523438, -0.09961700439453125, -0.09218215942382812, -0.084747314453125, -0.07731246948242188, -0.06987762451171875, -0.062442779541015625, -0.0550079345703125, -0.047573089599609375, -0.04013824462890625, -0.032703399658203125, -0.0252685546875, -0.017833709716796875, -0.01039886474609375, -0.002964019775390625, 0.0044708251953125, 0.011905670166015625, 0.01934051513671875, 0.026775360107421875, 0.034210205078125, 0.041645050048828125, 0.04907989501953125, 0.056514739990234375, 0.0639495849609375, 0.07138442993164062, 0.07881927490234375, 0.08625411987304688, 0.09368896484375, 0.10112380981445312, 0.10855865478515625, 0.11599349975585938, 0.1234283447265625, 0.13086318969726562, 0.13829803466796875, 0.14573287963867188, 0.153167724609375, 0.16060256958007812, 0.16803741455078125, 0.17547225952148438, 0.1829071044921875, 0.19034194946289062, 0.19777679443359375, 0.20521163940429688, 0.212646484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 11.0, 13.0, 16.0, 19.0, 19.0, 20.0, 40.0, 46.0, 64.0, 60.0, 60.0, 64.0, 65.0, 63.0, 65.0, 57.0, 48.0, 59.0, 38.0, 36.0, 33.0, 25.0, 12.0, 15.0, 12.0, 10.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84130859375, -0.8064498901367188, -0.7715911865234375, -0.7367324829101562, -0.701873779296875, -0.6670150756835938, -0.6321563720703125, -0.5972976684570312, -0.56243896484375, -0.5275802612304688, -0.4927215576171875, -0.45786285400390625, -0.423004150390625, -0.38814544677734375, -0.3532867431640625, -0.31842803955078125, -0.2835693359375, -0.24871063232421875, -0.2138519287109375, -0.17899322509765625, -0.144134521484375, -0.10927581787109375, -0.0744171142578125, -0.03955841064453125, -0.00469970703125, 0.03015899658203125, 0.0650177001953125, 0.09987640380859375, 0.134735107421875, 0.16959381103515625, 0.2044525146484375, 0.23931121826171875, 0.274169921875, 0.30902862548828125, 0.3438873291015625, 0.37874603271484375, 0.413604736328125, 0.44846343994140625, 0.4833221435546875, 0.5181808471679688, 0.55303955078125, 0.5878982543945312, 0.6227569580078125, 0.6576156616210938, 0.692474365234375, 0.7273330688476562, 0.7621917724609375, 0.7970504760742188, 0.8319091796875, 0.8667678833007812, 0.9016265869140625, 0.9364852905273438, 0.971343994140625, 1.0062026977539062, 1.0410614013671875, 1.0759201049804688, 1.11077880859375, 1.1456375122070312, 1.1804962158203125, 1.2153549194335938, 1.250213623046875, 1.2850723266601562, 1.3199310302734375, 1.3547897338867188, 1.3896484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 11.0, 13.0, 13.0, 16.0, 35.0, 58.0, 70.0, 115.0, 174.0, 279.0, 489.0, 833.0, 1419.0, 2620.0, 4893.0, 10517.0, 24441.0, 67428.0, 220571.0, 416991.0, 194806.0, 60025.0, 22443.0, 9761.0, 4806.0, 2457.0, 1334.0, 735.0, 456.0, 283.0, 149.0, 95.0, 61.0, 61.0, 36.0, 25.0, 11.0, 10.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09600639343261719, -0.09313583374023438, -0.09026527404785156, -0.08739471435546875, -0.08452415466308594, -0.08165359497070312, -0.07878303527832031, -0.0759124755859375, -0.07304191589355469, -0.07017135620117188, -0.06730079650878906, -0.06443023681640625, -0.06155967712402344, -0.058689117431640625, -0.05581855773925781, -0.052947998046875, -0.05007743835449219, -0.047206878662109375, -0.04433631896972656, -0.04146575927734375, -0.03859519958496094, -0.035724639892578125, -0.03285408020019531, -0.0299835205078125, -0.027112960815429688, -0.024242401123046875, -0.021371841430664062, -0.01850128173828125, -0.015630722045898438, -0.012760162353515625, -0.009889602661132812, -0.00701904296875, -0.0041484832763671875, -0.001277923583984375, 0.0015926361083984375, 0.00446319580078125, 0.0073337554931640625, 0.010204315185546875, 0.013074874877929688, 0.0159454345703125, 0.018815994262695312, 0.021686553955078125, 0.024557113647460938, 0.02742767333984375, 0.030298233032226562, 0.033168792724609375, 0.03603935241699219, 0.038909912109375, 0.04178047180175781, 0.044651031494140625, 0.04752159118652344, 0.05039215087890625, 0.05326271057128906, 0.056133270263671875, 0.05900382995605469, 0.0618743896484375, 0.06474494934082031, 0.06761550903320312, 0.07048606872558594, 0.07335662841796875, 0.07622718811035156, 0.07909774780273438, 0.08196830749511719, 0.0848388671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 6.0, 8.0, 14.0, 16.0, 27.0, 29.0, 59.0, 62.0, 75.0, 113.0, 147.0, 131.0, 91.0, 64.0, 25.0, 28.0, 18.0, 13.0, 14.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.00010854005813598633, -0.00010555237531661987, -0.00010256469249725342, -9.957700967788696e-05, -9.658932685852051e-05, -9.360164403915405e-05, -9.06139612197876e-05, -8.762627840042114e-05, -8.463859558105469e-05, -8.165091276168823e-05, -7.866322994232178e-05, -7.567554712295532e-05, -7.268786430358887e-05, -6.970018148422241e-05, -6.671249866485596e-05, -6.37248158454895e-05, -6.073713302612305e-05, -5.774945020675659e-05, -5.476176738739014e-05, -5.177408456802368e-05, -4.8786401748657227e-05, -4.579871892929077e-05, -4.2811036109924316e-05, -3.982335329055786e-05, -3.6835670471191406e-05, -3.384798765182495e-05, -3.0860304832458496e-05, -2.787262201309204e-05, -2.4884939193725586e-05, -2.189725637435913e-05, -1.8909573554992676e-05, -1.592189073562622e-05, -1.2934207916259766e-05, -9.94652509689331e-06, -6.9588422775268555e-06, -3.9711594581604e-06, -9.834766387939453e-07, 2.0042061805725098e-06, 4.991888999938965e-06, 7.97957181930542e-06, 1.0967254638671875e-05, 1.395493745803833e-05, 1.6942620277404785e-05, 1.993030309677124e-05, 2.2917985916137695e-05, 2.590566873550415e-05, 2.8893351554870605e-05, 3.188103437423706e-05, 3.4868717193603516e-05, 3.785640001296997e-05, 4.0844082832336426e-05, 4.383176565170288e-05, 4.6819448471069336e-05, 4.980713129043579e-05, 5.2794814109802246e-05, 5.57824969291687e-05, 5.8770179748535156e-05, 6.175786256790161e-05, 6.474554538726807e-05, 6.773322820663452e-05, 7.072091102600098e-05, 7.370859384536743e-05, 7.669627666473389e-05, 7.968395948410034e-05, 8.26716423034668e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 19.0, 11.0, 21.0, 41.0, 39.0, 81.0, 120.0, 273.0, 483.0, 1058.0, 2800.0, 9518.0, 51849.0, 448429.0, 464127.0, 54783.0, 9855.0, 2825.0, 1072.0, 511.0, 251.0, 131.0, 67.0, 44.0, 36.0, 27.0, 17.0, 13.0, 8.0, 6.0, 3.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.164794921875, -0.15964698791503906, -0.15449905395507812, -0.1493511199951172, -0.14420318603515625, -0.1390552520751953, -0.13390731811523438, -0.12875938415527344, -0.1236114501953125, -0.11846351623535156, -0.11331558227539062, -0.10816764831542969, -0.10301971435546875, -0.09787178039550781, -0.09272384643554688, -0.08757591247558594, -0.082427978515625, -0.07728004455566406, -0.07213211059570312, -0.06698417663574219, -0.06183624267578125, -0.05668830871582031, -0.051540374755859375, -0.04639244079589844, -0.0412445068359375, -0.03609657287597656, -0.030948638916015625, -0.025800704956054688, -0.02065277099609375, -0.015504837036132812, -0.010356903076171875, -0.0052089691162109375, -6.103515625e-05, 0.0050868988037109375, 0.010234832763671875, 0.015382766723632812, 0.02053070068359375, 0.025678634643554688, 0.030826568603515625, 0.03597450256347656, 0.0411224365234375, 0.04627037048339844, 0.051418304443359375, 0.05656623840332031, 0.06171417236328125, 0.06686210632324219, 0.07201004028320312, 0.07715797424316406, 0.082305908203125, 0.08745384216308594, 0.09260177612304688, 0.09774971008300781, 0.10289764404296875, 0.10804557800292969, 0.11319351196289062, 0.11834144592285156, 0.1234893798828125, 0.12863731384277344, 0.13378524780273438, 0.1389331817626953, 0.14408111572265625, 0.1492290496826172, 0.15437698364257812, 0.15952491760253906, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 8.0, 14.0, 19.0, 11.0, 31.0, 24.0, 49.0, 60.0, 66.0, 67.0, 82.0, 69.0, 83.0, 68.0, 76.0, 54.0, 45.0, 34.0, 25.0, 23.0, 19.0, 13.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.02825927734375, -0.02743816375732422, -0.026617050170898438, -0.025795936584472656, -0.024974822998046875, -0.024153709411621094, -0.023332595825195312, -0.02251148223876953, -0.02169036865234375, -0.02086925506591797, -0.020048141479492188, -0.019227027893066406, -0.018405914306640625, -0.017584800720214844, -0.016763687133789062, -0.01594257354736328, -0.0151214599609375, -0.014300346374511719, -0.013479232788085938, -0.012658119201660156, -0.011837005615234375, -0.011015892028808594, -0.010194778442382812, -0.009373664855957031, -0.00855255126953125, -0.007731437683105469, -0.0069103240966796875, -0.006089210510253906, -0.005268096923828125, -0.004446983337402344, -0.0036258697509765625, -0.0028047561645507812, -0.001983642578125, -0.0011625289916992188, -0.0003414154052734375, 0.00047969818115234375, 0.001300811767578125, 0.0021219253540039062, 0.0029430389404296875, 0.0037641525268554688, 0.00458526611328125, 0.005406379699707031, 0.0062274932861328125, 0.007048606872558594, 0.007869720458984375, 0.008690834045410156, 0.009511947631835938, 0.010333061218261719, 0.0111541748046875, 0.011975288391113281, 0.012796401977539062, 0.013617515563964844, 0.014438629150390625, 0.015259742736816406, 0.016080856323242188, 0.01690196990966797, 0.01772308349609375, 0.01854419708251953, 0.019365310668945312, 0.020186424255371094, 0.021007537841796875, 0.021828651428222656, 0.022649765014648438, 0.02347087860107422, 0.0242919921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 14.0, 16.0, 34.0, 65.0, 126.0, 144.0, 196.0, 155.0, 104.0, 67.0, 29.0, 25.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5643506050109863, -1.5246598720550537, -1.484969139099121, -1.4452784061431885, -1.4055876731872559, -1.3658969402313232, -1.3262062072753906, -1.286515474319458, -1.2468247413635254, -1.2071340084075928, -1.1674432754516602, -1.1277525424957275, -1.088061809539795, -1.0483710765838623, -1.0086803436279297, -0.9689896106719971, -0.9292988777160645, -0.8896081447601318, -0.8499174118041992, -0.8102266788482666, -0.770535945892334, -0.7308452129364014, -0.6911544799804688, -0.6514637470245361, -0.6117730140686035, -0.5720822811126709, -0.5323915481567383, -0.49270081520080566, -0.45301008224487305, -0.41331934928894043, -0.3736286163330078, -0.3339378833770752, -0.2942470908164978, -0.2545563578605652, -0.21486562490463257, -0.17517489194869995, -0.13548415899276733, -0.09579342603683472, -0.0561026930809021, -0.016411960124969482, 0.023278772830963135, 0.06296950578689575, 0.10266023874282837, 0.142350971698761, 0.1820417046546936, 0.22173243761062622, 0.26142317056655884, 0.30111390352249146, 0.3408046364784241, 0.3804953694343567, 0.4201861023902893, 0.4598768353462219, 0.49956756830215454, 0.5392583012580872, 0.5789490342140198, 0.6186397671699524, 0.658330500125885, 0.6980212330818176, 0.7377119660377502, 0.7774026989936829, 0.8170934319496155, 0.8567841649055481, 0.8964748978614807, 0.9361656308174133, 0.975856363773346]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 12.0, 5.0, 21.0, 17.0, 22.0, 20.0, 21.0, 30.0, 25.0, 32.0, 34.0, 32.0, 41.0, 44.0, 34.0, 48.0, 46.0, 37.0, 41.0, 41.0, 34.0, 42.0, 36.0, 40.0, 24.0, 22.0, 25.0, 29.0, 23.0, 12.0, 16.0, 11.0, 13.0, 10.0, 11.0, 5.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.39865368604660034, -0.38615572452545166, -0.3736577332019806, -0.3611597716808319, -0.34866178035736084, -0.33616381883621216, -0.3236658573150635, -0.3111678659915924, -0.2986699044704437, -0.28617194294929504, -0.273673951625824, -0.2611759901046753, -0.24867801368236542, -0.23618003726005554, -0.22368206083774567, -0.2111840844154358, -0.19868610799312592, -0.18618813157081604, -0.17369015514850616, -0.1611921787261963, -0.1486942172050476, -0.13619624078273773, -0.12369826436042786, -0.11120029538869858, -0.0987023189663887, -0.08620434254407883, -0.07370637357234955, -0.06120839715003967, -0.048710424453020096, -0.03621245175600052, -0.023714475333690643, -0.011216506361961365, 0.0012814700603485107, 0.013779443688690662, 0.026277417317032814, 0.03877539187669754, 0.05127336457371712, 0.0637713372707367, 0.07626931369304657, 0.08876728266477585, 0.10126525908708572, 0.1137632355093956, 0.12626120448112488, 0.13875918090343475, 0.15125715732574463, 0.1637551188468933, 0.17625311017036438, 0.18875107169151306, 0.20124904811382294, 0.2137470245361328, 0.2262450009584427, 0.23874297738075256, 0.25124093890190125, 0.2637389302253723, 0.276236891746521, 0.2887348532676697, 0.30123284459114075, 0.31373080611228943, 0.3262287974357605, 0.3387267589569092, 0.35122475028038025, 0.36372271180152893, 0.376220703125, 0.3887186646461487, 0.40121662616729736]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 12.0, 15.0, 18.0, 25.0, 49.0, 77.0, 106.0, 162.0, 212.0, 371.0, 621.0, 1061.0, 1719.0, 2998.0, 5419.0, 10299.0, 19949.0, 41034.0, 95475.0, 307930.0, 367556.0, 103787.0, 44041.0, 21144.0, 10878.0, 5699.0, 3178.0, 1831.0, 1088.0, 623.0, 411.0, 260.0, 147.0, 117.0, 72.0, 58.0, 19.0, 22.0, 11.0, 10.0, 10.0, 12.0, 3.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4571685791015625, -0.442901611328125, -0.4286346435546875, -0.41436767578125, -0.4001007080078125, -0.385833740234375, -0.3715667724609375, -0.3572998046875, -0.3430328369140625, -0.328765869140625, -0.3144989013671875, -0.30023193359375, -0.2859649658203125, -0.271697998046875, -0.2574310302734375, -0.2431640625, -0.2288970947265625, -0.214630126953125, -0.2003631591796875, -0.18609619140625, -0.1718292236328125, -0.157562255859375, -0.1432952880859375, -0.1290283203125, -0.1147613525390625, -0.100494384765625, -0.0862274169921875, -0.07196044921875, -0.0576934814453125, -0.043426513671875, -0.0291595458984375, -0.014892578125, -0.0006256103515625, 0.013641357421875, 0.0279083251953125, 0.04217529296875, 0.0564422607421875, 0.070709228515625, 0.0849761962890625, 0.0992431640625, 0.1135101318359375, 0.127777099609375, 0.1420440673828125, 0.15631103515625, 0.1705780029296875, 0.184844970703125, 0.1991119384765625, 0.21337890625, 0.2276458740234375, 0.241912841796875, 0.2561798095703125, 0.27044677734375, 0.2847137451171875, 0.298980712890625, 0.3132476806640625, 0.3275146484375, 0.3417816162109375, 0.356048583984375, 0.3703155517578125, 0.38458251953125, 0.3988494873046875, 0.413116455078125, 0.4273834228515625, 0.441650390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 7.0, 12.0, 11.0, 12.0, 19.0, 17.0, 20.0, 29.0, 28.0, 33.0, 30.0, 48.0, 43.0, 37.0, 38.0, 49.0, 50.0, 52.0, 42.0, 52.0, 40.0, 51.0, 36.0, 32.0, 27.0, 33.0, 18.0, 26.0, 21.0, 18.0, 8.0, 9.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.998046875, -0.967803955078125, -0.93756103515625, -0.907318115234375, -0.8770751953125, -0.846832275390625, -0.81658935546875, -0.786346435546875, -0.756103515625, -0.725860595703125, -0.69561767578125, -0.665374755859375, -0.6351318359375, -0.604888916015625, -0.57464599609375, -0.544403076171875, -0.51416015625, -0.483917236328125, -0.45367431640625, -0.423431396484375, -0.3931884765625, -0.362945556640625, -0.33270263671875, -0.302459716796875, -0.272216796875, -0.241973876953125, -0.21173095703125, -0.181488037109375, -0.1512451171875, -0.121002197265625, -0.09075927734375, -0.060516357421875, -0.0302734375, -3.0517578125e-05, 0.03021240234375, 0.060455322265625, 0.0906982421875, 0.120941162109375, 0.15118408203125, 0.181427001953125, 0.211669921875, 0.241912841796875, 0.27215576171875, 0.302398681640625, 0.3326416015625, 0.362884521484375, 0.39312744140625, 0.423370361328125, 0.45361328125, 0.483856201171875, 0.51409912109375, 0.544342041015625, 0.5745849609375, 0.604827880859375, 0.63507080078125, 0.665313720703125, 0.695556640625, 0.725799560546875, 0.75604248046875, 0.786285400390625, 0.8165283203125, 0.846771240234375, 0.87701416015625, 0.907257080078125, 0.9375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 4.0, 7.0, 10.0, 12.0, 17.0, 29.0, 23.0, 23.0, 22.0, 28.0, 36.0, 62.0, 95.0, 149.0, 571.0, 20638.0, 1021067.0, 4841.0, 409.0, 134.0, 65.0, 51.0, 48.0, 34.0, 29.0, 30.0, 14.0, 25.0, 17.0, 10.0, 16.0, 12.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.66015625, -4.528411865234375, -4.39666748046875, -4.264923095703125, -4.1331787109375, -4.001434326171875, -3.86968994140625, -3.737945556640625, -3.606201171875, -3.474456787109375, -3.34271240234375, -3.210968017578125, -3.0792236328125, -2.947479248046875, -2.81573486328125, -2.683990478515625, -2.55224609375, -2.420501708984375, -2.28875732421875, -2.157012939453125, -2.0252685546875, -1.893524169921875, -1.76177978515625, -1.630035400390625, -1.498291015625, -1.366546630859375, -1.23480224609375, -1.103057861328125, -0.9713134765625, -0.839569091796875, -0.70782470703125, -0.576080322265625, -0.4443359375, -0.312591552734375, -0.18084716796875, -0.049102783203125, 0.0826416015625, 0.214385986328125, 0.34613037109375, 0.477874755859375, 0.609619140625, 0.741363525390625, 0.87310791015625, 1.004852294921875, 1.1365966796875, 1.268341064453125, 1.40008544921875, 1.531829833984375, 1.66357421875, 1.795318603515625, 1.92706298828125, 2.058807373046875, 2.1905517578125, 2.322296142578125, 2.45404052734375, 2.585784912109375, 2.717529296875, 2.849273681640625, 2.98101806640625, 3.112762451171875, 3.2445068359375, 3.376251220703125, 3.50799560546875, 3.639739990234375, 3.771484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 5.0, 10.0, 5.0, 9.0, 15.0, 19.0, 17.0, 19.0, 32.0, 29.0, 25.0, 30.0, 31.0, 55.0, 47.0, 48.0, 37.0, 47.0, 52.0, 47.0, 46.0, 40.0, 39.0, 37.0, 32.0, 32.0, 16.0, 38.0, 16.0, 21.0, 19.0, 16.0, 16.0, 10.0, 13.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.072265625, -1.0425643920898438, -1.0128631591796875, -0.9831619262695312, -0.953460693359375, -0.9237594604492188, -0.8940582275390625, -0.8643569946289062, -0.83465576171875, -0.8049545288085938, -0.7752532958984375, -0.7455520629882812, -0.715850830078125, -0.6861495971679688, -0.6564483642578125, -0.6267471313476562, -0.5970458984375, -0.5673446655273438, -0.5376434326171875, -0.5079421997070312, -0.478240966796875, -0.44853973388671875, -0.4188385009765625, -0.38913726806640625, -0.35943603515625, -0.32973480224609375, -0.3000335693359375, -0.27033233642578125, -0.240631103515625, -0.21092987060546875, -0.1812286376953125, -0.15152740478515625, -0.121826171875, -0.09212493896484375, -0.0624237060546875, -0.03272247314453125, -0.003021240234375, 0.02667999267578125, 0.0563812255859375, 0.08608245849609375, 0.11578369140625, 0.14548492431640625, 0.1751861572265625, 0.20488739013671875, 0.234588623046875, 0.26428985595703125, 0.2939910888671875, 0.32369232177734375, 0.3533935546875, 0.38309478759765625, 0.4127960205078125, 0.44249725341796875, 0.472198486328125, 0.5018997192382812, 0.5316009521484375, 0.5613021850585938, 0.59100341796875, 0.6207046508789062, 0.6504058837890625, 0.6801071166992188, 0.709808349609375, 0.7395095825195312, 0.7692108154296875, 0.7989120483398438, 0.82861328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 5.0, 10.0, 27.0, 36.0, 45.0, 94.0, 157.0, 322.0, 782.0, 2374.0, 10781.0, 97184.0, 872326.0, 53836.0, 7479.0, 1837.0, 634.0, 280.0, 152.0, 71.0, 45.0, 30.0, 13.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6005859375, -0.5831222534179688, -0.5656585693359375, -0.5481948852539062, -0.530731201171875, -0.5132675170898438, -0.4958038330078125, -0.47834014892578125, -0.46087646484375, -0.44341278076171875, -0.4259490966796875, -0.40848541259765625, -0.391021728515625, -0.37355804443359375, -0.3560943603515625, -0.33863067626953125, -0.3211669921875, -0.30370330810546875, -0.2862396240234375, -0.26877593994140625, -0.251312255859375, -0.23384857177734375, -0.2163848876953125, -0.19892120361328125, -0.18145751953125, -0.16399383544921875, -0.1465301513671875, -0.12906646728515625, -0.111602783203125, -0.09413909912109375, -0.0766754150390625, -0.05921173095703125, -0.041748046875, -0.02428436279296875, -0.0068206787109375, 0.01064300537109375, 0.028106689453125, 0.04557037353515625, 0.0630340576171875, 0.08049774169921875, 0.09796142578125, 0.11542510986328125, 0.1328887939453125, 0.15035247802734375, 0.167816162109375, 0.18527984619140625, 0.2027435302734375, 0.22020721435546875, 0.2376708984375, 0.25513458251953125, 0.2725982666015625, 0.29006195068359375, 0.307525634765625, 0.32498931884765625, 0.3424530029296875, 0.35991668701171875, 0.37738037109375, 0.39484405517578125, 0.4123077392578125, 0.42977142333984375, 0.447235107421875, 0.46469879150390625, 0.4821624755859375, 0.49962615966796875, 0.51708984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 2.0, 8.0, 2.0, 9.0, 8.0, 11.0, 18.0, 25.0, 34.0, 49.0, 37.0, 82.0, 110.0, 201.0, 118.0, 81.0, 53.0, 32.0, 26.0, 18.0, 9.0, 10.0, 12.0, 9.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.571676254272461e-05, -4.416331648826599e-05, -4.260987043380737e-05, -4.1056424379348755e-05, -3.950297832489014e-05, -3.794953227043152e-05, -3.63960862159729e-05, -3.484264016151428e-05, -3.3289194107055664e-05, -3.1735748052597046e-05, -3.0182301998138428e-05, -2.862885594367981e-05, -2.707540988922119e-05, -2.5521963834762573e-05, -2.3968517780303955e-05, -2.2415071725845337e-05, -2.086162567138672e-05, -1.93081796169281e-05, -1.7754733562469482e-05, -1.6201287508010864e-05, -1.4647841453552246e-05, -1.3094395399093628e-05, -1.154094934463501e-05, -9.987503290176392e-06, -8.434057235717773e-06, -6.880611181259155e-06, -5.327165126800537e-06, -3.773719072341919e-06, -2.2202730178833008e-06, -6.668269634246826e-07, 8.866190910339355e-07, 2.4400651454925537e-06, 3.993511199951172e-06, 5.54695725440979e-06, 7.100403308868408e-06, 8.653849363327026e-06, 1.0207295417785645e-05, 1.1760741472244263e-05, 1.3314187526702881e-05, 1.4867633581161499e-05, 1.6421079635620117e-05, 1.7974525690078735e-05, 1.9527971744537354e-05, 2.108141779899597e-05, 2.263486385345459e-05, 2.4188309907913208e-05, 2.5741755962371826e-05, 2.7295202016830444e-05, 2.8848648071289062e-05, 3.040209412574768e-05, 3.19555401802063e-05, 3.350898623466492e-05, 3.5062432289123535e-05, 3.661587834358215e-05, 3.816932439804077e-05, 3.972277045249939e-05, 4.127621650695801e-05, 4.2829662561416626e-05, 4.4383108615875244e-05, 4.593655467033386e-05, 4.749000072479248e-05, 4.90434467792511e-05, 5.059689283370972e-05, 5.2150338888168335e-05, 5.370378494262695e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 12.0, 11.0, 20.0, 21.0, 42.0, 63.0, 94.0, 177.0, 339.0, 702.0, 1778.0, 5772.0, 23101.0, 160505.0, 761148.0, 74663.0, 13884.0, 3758.0, 1243.0, 546.0, 294.0, 134.0, 81.0, 47.0, 37.0, 24.0, 23.0, 13.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.333740234375, -0.32196044921875, -0.3101806640625, -0.29840087890625, -0.28662109375, -0.27484130859375, -0.2630615234375, -0.25128173828125, -0.239501953125, -0.22772216796875, -0.2159423828125, -0.20416259765625, -0.1923828125, -0.18060302734375, -0.1688232421875, -0.15704345703125, -0.145263671875, -0.13348388671875, -0.1217041015625, -0.10992431640625, -0.09814453125, -0.08636474609375, -0.0745849609375, -0.06280517578125, -0.051025390625, -0.03924560546875, -0.0274658203125, -0.01568603515625, -0.00390625, 0.00787353515625, 0.0196533203125, 0.03143310546875, 0.043212890625, 0.05499267578125, 0.0667724609375, 0.07855224609375, 0.09033203125, 0.10211181640625, 0.1138916015625, 0.12567138671875, 0.137451171875, 0.14923095703125, 0.1610107421875, 0.17279052734375, 0.1845703125, 0.19635009765625, 0.2081298828125, 0.21990966796875, 0.231689453125, 0.24346923828125, 0.2552490234375, 0.26702880859375, 0.27880859375, 0.29058837890625, 0.3023681640625, 0.31414794921875, 0.325927734375, 0.33770751953125, 0.3494873046875, 0.36126708984375, 0.373046875, 0.38482666015625, 0.3966064453125, 0.40838623046875, 0.420166015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 7.0, 12.0, 15.0, 23.0, 23.0, 26.0, 38.0, 66.0, 66.0, 124.0, 172.0, 117.0, 66.0, 62.0, 36.0, 28.0, 18.0, 12.0, 10.0, 10.0, 14.0, 5.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1099853515625, -0.10611724853515625, -0.1022491455078125, -0.09838104248046875, -0.094512939453125, -0.09064483642578125, -0.0867767333984375, -0.08290863037109375, -0.07904052734375, -0.07517242431640625, -0.0713043212890625, -0.06743621826171875, -0.063568115234375, -0.05970001220703125, -0.0558319091796875, -0.05196380615234375, -0.048095703125, -0.04422760009765625, -0.0403594970703125, -0.03649139404296875, -0.032623291015625, -0.02875518798828125, -0.0248870849609375, -0.02101898193359375, -0.01715087890625, -0.01328277587890625, -0.0094146728515625, -0.00554656982421875, -0.001678466796875, 0.00218963623046875, 0.0060577392578125, 0.00992584228515625, 0.0137939453125, 0.01766204833984375, 0.0215301513671875, 0.02539825439453125, 0.029266357421875, 0.03313446044921875, 0.0370025634765625, 0.04087066650390625, 0.04473876953125, 0.04860687255859375, 0.0524749755859375, 0.05634307861328125, 0.060211181640625, 0.06407928466796875, 0.0679473876953125, 0.07181549072265625, 0.07568359375, 0.07955169677734375, 0.0834197998046875, 0.08728790283203125, 0.091156005859375, 0.09502410888671875, 0.0988922119140625, 0.10276031494140625, 0.10662841796875, 0.11049652099609375, 0.1143646240234375, 0.11823272705078125, 0.122100830078125, 0.12596893310546875, 0.1298370361328125, 0.13370513916015625, 0.1375732421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 29.0, 52.0, 150.0, 237.0, 264.0, 172.0, 69.0, 24.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.7317328453063965, -6.605012893676758, -6.478292465209961, -6.351572036743164, -6.224852085113525, -6.098132133483887, -5.97141170501709, -5.844691276550293, -5.717971324920654, -5.591251373291016, -5.464530944824219, -5.337810516357422, -5.211090564727783, -5.0843706130981445, -4.957650184631348, -4.830929756164551, -4.704209804534912, -4.577489852905273, -4.450769424438477, -4.32404899597168, -4.197329044342041, -4.070609092712402, -3.9438886642456055, -3.8171684741973877, -3.69044828414917, -3.563728094100952, -3.4370079040527344, -3.3102877140045166, -3.183567523956299, -3.056847333908081, -2.9301271438598633, -2.8034069538116455, -2.676687240600586, -2.549967050552368, -2.4232468605041504, -2.2965266704559326, -2.169806480407715, -2.043086290359497, -1.9163661003112793, -1.7896459102630615, -1.6629256010055542, -1.5362054109573364, -1.4094852209091187, -1.2827650308609009, -1.156044840812683, -1.0293246507644653, -0.9026044607162476, -0.7758842706680298, -0.649164080619812, -0.5224438905715942, -0.39572370052337646, -0.2690035104751587, -0.14228332042694092, -0.015563130378723145, 0.11115705966949463, 0.2378772497177124, 0.3645974397659302, 0.49131762981414795, 0.6180378198623657, 0.7447580099105835, 0.8714781999588013, 0.998198390007019, 1.1249185800552368, 1.2516387701034546, 1.3783589601516724]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 5.0, 8.0, 10.0, 11.0, 26.0, 19.0, 20.0, 19.0, 23.0, 33.0, 41.0, 37.0, 56.0, 44.0, 56.0, 46.0, 60.0, 63.0, 57.0, 53.0, 52.0, 42.0, 29.0, 37.0, 36.0, 23.0, 23.0, 24.0, 14.0, 9.0, 3.0, 12.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7252743244171143, -1.6719555854797363, -1.618636965751648, -1.56531822681427, -1.5119996070861816, -1.4586808681488037, -1.4053621292114258, -1.3520435094833374, -1.298724889755249, -1.245406150817871, -1.1920875310897827, -1.1387687921524048, -1.0854501724243164, -1.0321314334869385, -0.9788127541542053, -0.9254940748214722, -0.8721753358840942, -0.8188566565513611, -0.7655379772186279, -0.71221923828125, -0.6589006185531616, -0.6055818796157837, -0.5522632002830505, -0.4989445209503174, -0.44562584161758423, -0.3923071622848511, -0.3389884829521179, -0.2856697738170624, -0.23235109448432922, -0.17903241515159607, -0.12571370601654053, -0.07239502668380737, -0.01907634735107422, 0.03424233943223953, 0.08756102621555328, 0.14087972044944763, 0.1941983997821808, 0.24751707911491394, 0.3008357882499695, 0.35415446758270264, 0.4074731469154358, 0.46079182624816895, 0.5141105055809021, 0.5674291849136353, 0.6207479238510132, 0.6740665435791016, 0.7273852825164795, 0.7807039618492126, 0.8340226411819458, 0.887341320514679, 0.9406599998474121, 0.99397873878479, 1.0472973585128784, 1.1006160974502563, 1.1539347171783447, 1.2072534561157227, 1.2605721950531006, 1.3138909339904785, 1.367209553718567, 1.4205282926559448, 1.4738469123840332, 1.5271656513214111, 1.580484390258789, 1.6338030099868774, 1.6871216297149658]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 17.0, 16.0, 26.0, 48.0, 83.0, 119.0, 200.0, 334.0, 601.0, 1136.0, 2304.0, 5282.0, 14796.0, 54261.0, 297547.0, 1568596.0, 1781274.0, 376908.0, 63946.0, 16164.0, 5655.0, 2355.0, 1118.0, 594.0, 280.0, 206.0, 134.0, 84.0, 57.0, 37.0, 31.0, 20.0, 9.0, 4.0, 9.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.845703125, -0.8193206787109375, -0.792938232421875, -0.7665557861328125, -0.74017333984375, -0.7137908935546875, -0.687408447265625, -0.6610260009765625, -0.6346435546875, -0.6082611083984375, -0.581878662109375, -0.5554962158203125, -0.52911376953125, -0.5027313232421875, -0.476348876953125, -0.4499664306640625, -0.423583984375, -0.3972015380859375, -0.370819091796875, -0.3444366455078125, -0.31805419921875, -0.2916717529296875, -0.265289306640625, -0.2389068603515625, -0.2125244140625, -0.1861419677734375, -0.159759521484375, -0.1333770751953125, -0.10699462890625, -0.0806121826171875, -0.054229736328125, -0.0278472900390625, -0.00146484375, 0.0249176025390625, 0.051300048828125, 0.0776824951171875, 0.10406494140625, 0.1304473876953125, 0.156829833984375, 0.1832122802734375, 0.2095947265625, 0.2359771728515625, 0.262359619140625, 0.2887420654296875, 0.31512451171875, 0.3415069580078125, 0.367889404296875, 0.3942718505859375, 0.420654296875, 0.4470367431640625, 0.473419189453125, 0.4998016357421875, 0.52618408203125, 0.5525665283203125, 0.578948974609375, 0.6053314208984375, 0.6317138671875, 0.6580963134765625, 0.684478759765625, 0.7108612060546875, 0.73724365234375, 0.7636260986328125, 0.790008544921875, 0.8163909912109375, 0.8427734375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 10.0, 16.0, 13.0, 18.0, 15.0, 24.0, 27.0, 35.0, 28.0, 34.0, 43.0, 45.0, 43.0, 50.0, 42.0, 45.0, 39.0, 54.0, 43.0, 38.0, 43.0, 45.0, 26.0, 29.0, 32.0, 22.0, 26.0, 10.0, 19.0, 14.0, 7.0, 11.0, 5.0, 12.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.646484375, -0.6278533935546875, -0.609222412109375, -0.5905914306640625, -0.57196044921875, -0.5533294677734375, -0.534698486328125, -0.5160675048828125, -0.4974365234375, -0.4788055419921875, -0.460174560546875, -0.4415435791015625, -0.42291259765625, -0.4042816162109375, -0.385650634765625, -0.3670196533203125, -0.348388671875, -0.3297576904296875, -0.311126708984375, -0.2924957275390625, -0.27386474609375, -0.2552337646484375, -0.236602783203125, -0.2179718017578125, -0.1993408203125, -0.1807098388671875, -0.162078857421875, -0.1434478759765625, -0.12481689453125, -0.1061859130859375, -0.087554931640625, -0.0689239501953125, -0.05029296875, -0.0316619873046875, -0.013031005859375, 0.0055999755859375, 0.02423095703125, 0.0428619384765625, 0.061492919921875, 0.0801239013671875, 0.0987548828125, 0.1173858642578125, 0.136016845703125, 0.1546478271484375, 0.17327880859375, 0.1919097900390625, 0.210540771484375, 0.2291717529296875, 0.247802734375, 0.2664337158203125, 0.285064697265625, 0.3036956787109375, 0.32232666015625, 0.3409576416015625, 0.359588623046875, 0.3782196044921875, 0.3968505859375, 0.4154815673828125, 0.434112548828125, 0.4527435302734375, 0.47137451171875, 0.4900054931640625, 0.508636474609375, 0.5272674560546875, 0.5458984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 7.0, 8.0, 13.0, 19.0, 23.0, 44.0, 75.0, 154.0, 205.0, 471.0, 1299.0, 4671.0, 38342.0, 2397500.0, 1712165.0, 32552.0, 4486.0, 1242.0, 451.0, 183.0, 109.0, 74.0, 47.0, 36.0, 23.0, 21.0, 5.0, 9.0, 10.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.064453125, -2.00860595703125, -1.9527587890625, -1.89691162109375, -1.841064453125, -1.78521728515625, -1.7293701171875, -1.67352294921875, -1.61767578125, -1.56182861328125, -1.5059814453125, -1.45013427734375, -1.394287109375, -1.33843994140625, -1.2825927734375, -1.22674560546875, -1.1708984375, -1.11505126953125, -1.0592041015625, -1.00335693359375, -0.947509765625, -0.89166259765625, -0.8358154296875, -0.77996826171875, -0.72412109375, -0.66827392578125, -0.6124267578125, -0.55657958984375, -0.500732421875, -0.44488525390625, -0.3890380859375, -0.33319091796875, -0.27734375, -0.22149658203125, -0.1656494140625, -0.10980224609375, -0.053955078125, 0.00189208984375, 0.0577392578125, 0.11358642578125, 0.16943359375, 0.22528076171875, 0.2811279296875, 0.33697509765625, 0.392822265625, 0.44866943359375, 0.5045166015625, 0.56036376953125, 0.6162109375, 0.67205810546875, 0.7279052734375, 0.78375244140625, 0.839599609375, 0.89544677734375, 0.9512939453125, 1.00714111328125, 1.06298828125, 1.11883544921875, 1.1746826171875, 1.23052978515625, 1.286376953125, 1.34222412109375, 1.3980712890625, 1.45391845703125, 1.509765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 10.0, 16.0, 20.0, 22.0, 34.0, 59.0, 89.0, 118.0, 185.0, 306.0, 437.0, 582.0, 672.0, 515.0, 332.0, 216.0, 141.0, 94.0, 64.0, 51.0, 24.0, 21.0, 12.0, 11.0, 6.0, 1.0, 9.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24585342407226562, -0.23609161376953125, -0.22632980346679688, -0.2165679931640625, -0.20680618286132812, -0.19704437255859375, -0.18728256225585938, -0.177520751953125, -0.16775894165039062, -0.15799713134765625, -0.14823532104492188, -0.1384735107421875, -0.12871170043945312, -0.11894989013671875, -0.10918807983398438, -0.09942626953125, -0.08966445922851562, -0.07990264892578125, -0.07014083862304688, -0.0603790283203125, -0.050617218017578125, -0.04085540771484375, -0.031093597412109375, -0.021331787109375, -0.011569976806640625, -0.00180816650390625, 0.007953643798828125, 0.0177154541015625, 0.027477264404296875, 0.03723907470703125, 0.047000885009765625, 0.0567626953125, 0.06652450561523438, 0.07628631591796875, 0.08604812622070312, 0.0958099365234375, 0.10557174682617188, 0.11533355712890625, 0.12509536743164062, 0.134857177734375, 0.14461898803710938, 0.15438079833984375, 0.16414260864257812, 0.1739044189453125, 0.18366622924804688, 0.19342803955078125, 0.20318984985351562, 0.21295166015625, 0.22271347045898438, 0.23247528076171875, 0.24223709106445312, 0.2519989013671875, 0.2617607116699219, 0.27152252197265625, 0.2812843322753906, 0.291046142578125, 0.3008079528808594, 0.31056976318359375, 0.3203315734863281, 0.3300933837890625, 0.3398551940917969, 0.34961700439453125, 0.3593788146972656, 0.369140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 5.0, 10.0, 21.0, 34.0, 34.0, 62.0, 93.0, 116.0, 133.0, 117.0, 98.0, 91.0, 71.0, 50.0, 25.0, 14.0, 11.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.818373441696167, -1.772924780845642, -1.7274761199951172, -1.6820274591445923, -1.6365787982940674, -1.5911301374435425, -1.5456814765930176, -1.5002328157424927, -1.4547841548919678, -1.4093354940414429, -1.363886833190918, -1.318438172340393, -1.2729895114898682, -1.2275408506393433, -1.1820921897888184, -1.1366435289382935, -1.0911948680877686, -1.0457462072372437, -1.0002975463867188, -0.9548488855361938, -0.909400224685669, -0.863951563835144, -0.8185029029846191, -0.7730542421340942, -0.7276055812835693, -0.6821569204330444, -0.6367082595825195, -0.5912595987319946, -0.5458109378814697, -0.5003622770309448, -0.4549136161804199, -0.409464955329895, -0.3640162944793701, -0.3185676336288452, -0.2731189727783203, -0.2276703119277954, -0.1822216510772705, -0.1367729902267456, -0.0913243293762207, -0.0458756685256958, -0.00042700767517089844, 0.045021653175354004, 0.0904703140258789, 0.1359189748764038, 0.1813676357269287, 0.2268162965774536, 0.2722649574279785, 0.3177136182785034, 0.3631622791290283, 0.4086109399795532, 0.4540596008300781, 0.499508261680603, 0.5449569225311279, 0.5904055833816528, 0.6358542442321777, 0.6813029050827026, 0.7267515659332275, 0.7722002267837524, 0.8176488876342773, 0.8630975484848022, 0.9085462093353271, 0.953994870185852, 0.999443531036377, 1.0448921918869019, 1.0903408527374268]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 2.0, 1.0, 9.0, 3.0, 8.0, 8.0, 10.0, 13.0, 19.0, 18.0, 20.0, 26.0, 27.0, 24.0, 30.0, 38.0, 49.0, 40.0, 42.0, 49.0, 55.0, 52.0, 40.0, 42.0, 44.0, 38.0, 35.0, 29.0, 35.0, 38.0, 30.0, 25.0, 19.0, 12.0, 14.0, 11.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6541244387626648, -0.6333881616592407, -0.6126518845558167, -0.5919156074523926, -0.5711793303489685, -0.5504430532455444, -0.5297067761421204, -0.5089704990386963, -0.4882342517375946, -0.46749797463417053, -0.44676169753074646, -0.4260254204273224, -0.4052891731262207, -0.38455289602279663, -0.36381661891937256, -0.3430803418159485, -0.3223440647125244, -0.30160778760910034, -0.28087151050567627, -0.2601352334022522, -0.23939897119998932, -0.21866269409656525, -0.19792643189430237, -0.1771901547908783, -0.15645387768745422, -0.13571760058403015, -0.11498133093118668, -0.0942450612783432, -0.07350878417491913, -0.052772507071495056, -0.03203623741865158, -0.011299967765808105, 0.009436309337615967, 0.03017258271574974, 0.050908856093883514, 0.07164512574672699, 0.09238140285015106, 0.11311767995357513, 0.133853942155838, 0.15459021925926208, 0.17532649636268616, 0.19606277346611023, 0.2167990505695343, 0.23753531277179718, 0.25827157497406006, 0.27900785207748413, 0.2997441291809082, 0.3204804062843323, 0.34121668338775635, 0.3619529604911804, 0.3826892375946045, 0.40342551469802856, 0.42416179180145264, 0.4448980689048767, 0.4656343162059784, 0.48637059330940247, 0.5071069002151489, 0.527843177318573, 0.5485794544219971, 0.5693157315254211, 0.5900520086288452, 0.6107882857322693, 0.6315245628356934, 0.6522607803344727, 0.6729970574378967]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 12.0, 15.0, 32.0, 78.0, 156.0, 429.0, 1588.0, 5814.0, 26786.0, 356382.0, 610154.0, 36789.0, 7485.0, 1899.0, 549.0, 192.0, 72.0, 30.0, 32.0, 11.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.8002548217773438, -0.7753143310546875, -0.7503738403320312, -0.725433349609375, -0.7004928588867188, -0.6755523681640625, -0.6506118774414062, -0.62567138671875, -0.6007308959960938, -0.5757904052734375, -0.5508499145507812, -0.525909423828125, -0.5009689331054688, -0.4760284423828125, -0.45108795166015625, -0.4261474609375, -0.40120697021484375, -0.3762664794921875, -0.35132598876953125, -0.326385498046875, -0.30144500732421875, -0.2765045166015625, -0.25156402587890625, -0.22662353515625, -0.20168304443359375, -0.1767425537109375, -0.15180206298828125, -0.126861572265625, -0.10192108154296875, -0.0769805908203125, -0.05204010009765625, -0.027099609375, -0.00215911865234375, 0.0227813720703125, 0.04772186279296875, 0.072662353515625, 0.09760284423828125, 0.1225433349609375, 0.14748382568359375, 0.17242431640625, 0.19736480712890625, 0.2223052978515625, 0.24724578857421875, 0.272186279296875, 0.29712677001953125, 0.3220672607421875, 0.34700775146484375, 0.3719482421875, 0.39688873291015625, 0.4218292236328125, 0.44676971435546875, 0.471710205078125, 0.49665069580078125, 0.5215911865234375, 0.5465316772460938, 0.57147216796875, 0.5964126586914062, 0.6213531494140625, 0.6462936401367188, 0.671234130859375, 0.6961746215820312, 0.7211151123046875, 0.7460556030273438, 0.77099609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 18.0, 11.0, 15.0, 23.0, 28.0, 34.0, 41.0, 37.0, 49.0, 56.0, 67.0, 70.0, 63.0, 65.0, 58.0, 49.0, 48.0, 53.0, 36.0, 41.0, 23.0, 25.0, 18.0, 17.0, 12.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3955078125, -0.3795318603515625, -0.363555908203125, -0.3475799560546875, -0.33160400390625, -0.3156280517578125, -0.299652099609375, -0.2836761474609375, -0.2677001953125, -0.2517242431640625, -0.235748291015625, -0.2197723388671875, -0.20379638671875, -0.1878204345703125, -0.171844482421875, -0.1558685302734375, -0.139892578125, -0.1239166259765625, -0.107940673828125, -0.0919647216796875, -0.07598876953125, -0.0600128173828125, -0.044036865234375, -0.0280609130859375, -0.0120849609375, 0.0038909912109375, 0.019866943359375, 0.0358428955078125, 0.05181884765625, 0.0677947998046875, 0.083770751953125, 0.0997467041015625, 0.11572265625, 0.1316986083984375, 0.147674560546875, 0.1636505126953125, 0.17962646484375, 0.1956024169921875, 0.211578369140625, 0.2275543212890625, 0.2435302734375, 0.2595062255859375, 0.275482177734375, 0.2914581298828125, 0.30743408203125, 0.3234100341796875, 0.339385986328125, 0.3553619384765625, 0.371337890625, 0.3873138427734375, 0.403289794921875, 0.4192657470703125, 0.43524169921875, 0.4512176513671875, 0.467193603515625, 0.4831695556640625, 0.4991455078125, 0.5151214599609375, 0.531097412109375, 0.5470733642578125, 0.56304931640625, 0.5790252685546875, 0.595001220703125, 0.6109771728515625, 0.626953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 16.0, 17.0, 17.0, 42.0, 56.0, 62.0, 100.0, 159.0, 241.0, 357.0, 554.0, 919.0, 1515.0, 2636.0, 4955.0, 9650.0, 18957.0, 41613.0, 102555.0, 259863.0, 331754.0, 157890.0, 60422.0, 26368.0, 12604.0, 6546.0, 3534.0, 1960.0, 1110.0, 697.0, 440.0, 317.0, 191.0, 123.0, 98.0, 51.0, 44.0, 32.0, 17.0, 15.0, 10.0, 12.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1614990234375, -0.15615463256835938, -0.15081024169921875, -0.14546585083007812, -0.1401214599609375, -0.13477706909179688, -0.12943267822265625, -0.12408828735351562, -0.118743896484375, -0.11339950561523438, -0.10805511474609375, -0.10271072387695312, -0.0973663330078125, -0.09202194213867188, -0.08667755126953125, -0.08133316040039062, -0.07598876953125, -0.07064437866210938, -0.06529998779296875, -0.059955596923828125, -0.0546112060546875, -0.049266815185546875, -0.04392242431640625, -0.038578033447265625, -0.033233642578125, -0.027889251708984375, -0.02254486083984375, -0.017200469970703125, -0.0118560791015625, -0.006511688232421875, -0.00116729736328125, 0.004177093505859375, 0.009521484375, 0.014865875244140625, 0.02021026611328125, 0.025554656982421875, 0.0308990478515625, 0.036243438720703125, 0.04158782958984375, 0.046932220458984375, 0.052276611328125, 0.057621002197265625, 0.06296539306640625, 0.06830978393554688, 0.0736541748046875, 0.07899856567382812, 0.08434295654296875, 0.08968734741210938, 0.09503173828125, 0.10037612915039062, 0.10572052001953125, 0.11106491088867188, 0.1164093017578125, 0.12175369262695312, 0.12709808349609375, 0.13244247436523438, 0.137786865234375, 0.14313125610351562, 0.14847564697265625, 0.15382003784179688, 0.1591644287109375, 0.16450881958007812, 0.16985321044921875, 0.17519760131835938, 0.1805419921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 12.0, 9.0, 11.0, 9.0, 15.0, 25.0, 18.0, 24.0, 35.0, 35.0, 26.0, 48.0, 44.0, 39.0, 44.0, 47.0, 47.0, 48.0, 54.0, 55.0, 41.0, 39.0, 39.0, 38.0, 35.0, 32.0, 24.0, 21.0, 9.0, 17.0, 5.0, 11.0, 10.0, 7.0, 4.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.849609375, -0.8239212036132812, -0.7982330322265625, -0.7725448608398438, -0.746856689453125, -0.7211685180664062, -0.6954803466796875, -0.6697921752929688, -0.64410400390625, -0.6184158325195312, -0.5927276611328125, -0.5670394897460938, -0.541351318359375, -0.5156631469726562, -0.4899749755859375, -0.46428680419921875, -0.4385986328125, -0.41291046142578125, -0.3872222900390625, -0.36153411865234375, -0.335845947265625, -0.31015777587890625, -0.2844696044921875, -0.25878143310546875, -0.23309326171875, -0.20740509033203125, -0.1817169189453125, -0.15602874755859375, -0.130340576171875, -0.10465240478515625, -0.0789642333984375, -0.05327606201171875, -0.027587890625, -0.00189971923828125, 0.0237884521484375, 0.04947662353515625, 0.075164794921875, 0.10085296630859375, 0.1265411376953125, 0.15222930908203125, 0.17791748046875, 0.20360565185546875, 0.2292938232421875, 0.25498199462890625, 0.280670166015625, 0.30635833740234375, 0.3320465087890625, 0.35773468017578125, 0.3834228515625, 0.40911102294921875, 0.4347991943359375, 0.46048736572265625, 0.486175537109375, 0.5118637084960938, 0.5375518798828125, 0.5632400512695312, 0.58892822265625, 0.6146163940429688, 0.6403045654296875, 0.6659927368164062, 0.691680908203125, 0.7173690795898438, 0.7430572509765625, 0.7687454223632812, 0.79443359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 18.0, 17.0, 29.0, 57.0, 81.0, 155.0, 291.0, 591.0, 1199.0, 2858.0, 7305.0, 21363.0, 79683.0, 327958.0, 434804.0, 123545.0, 31667.0, 10162.0, 3553.0, 1590.0, 747.0, 376.0, 209.0, 101.0, 79.0, 33.0, 28.0, 16.0, 10.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06960391998291016, -0.06736946105957031, -0.06513500213623047, -0.06290054321289062, -0.06066608428955078, -0.05843162536621094, -0.056197166442871094, -0.05396270751953125, -0.051728248596191406, -0.04949378967285156, -0.04725933074951172, -0.045024871826171875, -0.04279041290283203, -0.04055595397949219, -0.038321495056152344, -0.0360870361328125, -0.033852577209472656, -0.03161811828613281, -0.02938365936279297, -0.027149200439453125, -0.02491474151611328, -0.022680282592773438, -0.020445823669433594, -0.01821136474609375, -0.015976905822753906, -0.013742446899414062, -0.011507987976074219, -0.009273529052734375, -0.007039070129394531, -0.0048046112060546875, -0.0025701522827148438, -0.000335693359375, 0.0018987655639648438, 0.0041332244873046875, 0.006367683410644531, 0.008602142333984375, 0.010836601257324219, 0.013071060180664062, 0.015305519104003906, 0.01753997802734375, 0.019774436950683594, 0.022008895874023438, 0.02424335479736328, 0.026477813720703125, 0.02871227264404297, 0.030946731567382812, 0.033181190490722656, 0.0354156494140625, 0.037650108337402344, 0.03988456726074219, 0.04211902618408203, 0.044353485107421875, 0.04658794403076172, 0.04882240295410156, 0.051056861877441406, 0.05329132080078125, 0.055525779724121094, 0.05776023864746094, 0.05999469757080078, 0.062229156494140625, 0.06446361541748047, 0.06669807434082031, 0.06893253326416016, 0.0711669921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 7.0, 5.0, 9.0, 6.0, 12.0, 17.0, 29.0, 19.0, 40.0, 57.0, 84.0, 94.0, 113.0, 123.0, 90.0, 101.0, 55.0, 39.0, 24.0, 15.0, 14.0, 15.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337860107421875e-05, -3.192480653524399e-05, -3.0471011996269226e-05, -2.9017217457294464e-05, -2.7563422918319702e-05, -2.610962837934494e-05, -2.4655833840370178e-05, -2.3202039301395416e-05, -2.1748244762420654e-05, -2.0294450223445892e-05, -1.884065568447113e-05, -1.738686114549637e-05, -1.5933066606521606e-05, -1.4479272067546844e-05, -1.3025477528572083e-05, -1.157168298959732e-05, -1.0117888450622559e-05, -8.664093911647797e-06, -7.210299372673035e-06, -5.756504833698273e-06, -4.302710294723511e-06, -2.8489157557487488e-06, -1.3951212167739868e-06, 5.8673322200775146e-08, 1.5124678611755371e-06, 2.966262400150299e-06, 4.420056939125061e-06, 5.873851478099823e-06, 7.327646017074585e-06, 8.781440556049347e-06, 1.0235235095024109e-05, 1.1689029633998871e-05, 1.3142824172973633e-05, 1.4596618711948395e-05, 1.6050413250923157e-05, 1.750420778989792e-05, 1.895800232887268e-05, 2.0411796867847443e-05, 2.1865591406822205e-05, 2.3319385945796967e-05, 2.477318048477173e-05, 2.622697502374649e-05, 2.7680769562721252e-05, 2.9134564101696014e-05, 3.0588358640670776e-05, 3.204215317964554e-05, 3.34959477186203e-05, 3.494974225759506e-05, 3.6403536796569824e-05, 3.7857331335544586e-05, 3.931112587451935e-05, 4.076492041349411e-05, 4.221871495246887e-05, 4.3672509491443634e-05, 4.5126304030418396e-05, 4.658009856939316e-05, 4.803389310836792e-05, 4.948768764734268e-05, 5.0941482186317444e-05, 5.2395276725292206e-05, 5.384907126426697e-05, 5.530286580324173e-05, 5.675666034221649e-05, 5.8210454881191254e-05, 5.9664249420166016e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 11.0, 29.0, 48.0, 91.0, 165.0, 414.0, 1247.0, 4424.0, 20379.0, 164937.0, 692577.0, 140040.0, 18233.0, 4042.0, 1143.0, 394.0, 133.0, 89.0, 56.0, 19.0, 23.0, 11.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.120361328125, -0.11653614044189453, -0.11271095275878906, -0.1088857650756836, -0.10506057739257812, -0.10123538970947266, -0.09741020202636719, -0.09358501434326172, -0.08975982666015625, -0.08593463897705078, -0.08210945129394531, -0.07828426361083984, -0.07445907592773438, -0.0706338882446289, -0.06680870056152344, -0.06298351287841797, -0.0591583251953125, -0.05533313751220703, -0.05150794982910156, -0.047682762145996094, -0.043857574462890625, -0.040032386779785156, -0.03620719909667969, -0.03238201141357422, -0.02855682373046875, -0.02473163604736328, -0.020906448364257812, -0.017081260681152344, -0.013256072998046875, -0.009430885314941406, -0.0056056976318359375, -0.0017805099487304688, 0.002044677734375, 0.005869865417480469, 0.009695053100585938, 0.013520240783691406, 0.017345428466796875, 0.021170616149902344, 0.024995803833007812, 0.02882099151611328, 0.03264617919921875, 0.03647136688232422, 0.04029655456542969, 0.044121742248535156, 0.047946929931640625, 0.051772117614746094, 0.05559730529785156, 0.05942249298095703, 0.0632476806640625, 0.06707286834716797, 0.07089805603027344, 0.0747232437133789, 0.07854843139648438, 0.08237361907958984, 0.08619880676269531, 0.09002399444580078, 0.09384918212890625, 0.09767436981201172, 0.10149955749511719, 0.10532474517822266, 0.10914993286132812, 0.1129751205444336, 0.11680030822753906, 0.12062549591064453, 0.12445068359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 19.0, 21.0, 29.0, 35.0, 35.0, 57.0, 51.0, 80.0, 96.0, 91.0, 85.0, 75.0, 59.0, 58.0, 48.0, 28.0, 21.0, 15.0, 9.0, 14.0, 10.0, 8.0, 4.0, 3.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0178070068359375, -0.017240524291992188, -0.016674041748046875, -0.016107559204101562, -0.01554107666015625, -0.014974594116210938, -0.014408111572265625, -0.013841629028320312, -0.013275146484375, -0.012708663940429688, -0.012142181396484375, -0.011575698852539062, -0.01100921630859375, -0.010442733764648438, -0.009876251220703125, -0.009309768676757812, -0.0087432861328125, -0.008176803588867188, -0.007610321044921875, -0.0070438385009765625, -0.00647735595703125, -0.0059108734130859375, -0.005344390869140625, -0.0047779083251953125, -0.00421142578125, -0.0036449432373046875, -0.003078460693359375, -0.0025119781494140625, -0.00194549560546875, -0.0013790130615234375, -0.000812530517578125, -0.0002460479736328125, 0.0003204345703125, 0.0008869171142578125, 0.001453399658203125, 0.0020198822021484375, 0.00258636474609375, 0.0031528472900390625, 0.003719329833984375, 0.0042858123779296875, 0.004852294921875, 0.0054187774658203125, 0.005985260009765625, 0.0065517425537109375, 0.00711822509765625, 0.0076847076416015625, 0.008251190185546875, 0.008817672729492188, 0.0093841552734375, 0.009950637817382812, 0.010517120361328125, 0.011083602905273438, 0.01165008544921875, 0.012216567993164062, 0.012783050537109375, 0.013349533081054688, 0.013916015625, 0.014482498168945312, 0.015048980712890625, 0.015615463256835938, 0.01618194580078125, 0.016748428344726562, 0.017314910888671875, 0.017881393432617188, 0.0184478759765625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 16.0, 39.0, 97.0, 209.0, 236.0, 204.0, 104.0, 58.0, 17.0, 12.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0388071537017822, -1.9919952154159546, -1.9451831579208374, -1.8983712196350098, -1.8515591621398926, -1.804747223854065, -1.7579352855682373, -1.7111232280731201, -1.6643112897872925, -1.6174993515014648, -1.5706872940063477, -1.52387535572052, -1.4770632982254028, -1.4302513599395752, -1.383439302444458, -1.3366273641586304, -1.2898154258728027, -1.243003487586975, -1.196191430091858, -1.1493794918060303, -1.102567434310913, -1.0557554960250854, -1.0089435577392578, -0.9621315002441406, -0.9153194427490234, -0.868507444858551, -0.8216954469680786, -0.774883508682251, -0.7280715107917786, -0.6812595129013062, -0.6344475150108337, -0.5876355171203613, -0.5408235788345337, -0.4940115809440613, -0.44719961285591125, -0.40038761496543884, -0.3535756468772888, -0.3067636489868164, -0.259951651096344, -0.21313968300819397, -0.16632768511772156, -0.11951570212841034, -0.07270371168851852, -0.02589172124862671, 0.02092026174068451, 0.06773224472999573, 0.11454424262046814, 0.16135621070861816, 0.20816820859909058, 0.254980206489563, 0.301792174577713, 0.3486041724681854, 0.39541614055633545, 0.44222813844680786, 0.4890401363372803, 0.5358520746231079, 0.5826641321182251, 0.6294761300086975, 0.6762881278991699, 0.7231000661849976, 0.76991206407547, 0.8167240619659424, 0.8635360598564148, 0.9103480577468872, 0.9571599960327148]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 16.0, 15.0, 22.0, 22.0, 30.0, 25.0, 38.0, 35.0, 41.0, 63.0, 34.0, 64.0, 54.0, 61.0, 48.0, 58.0, 44.0, 46.0, 29.0, 39.0, 33.0, 35.0, 26.0, 18.0, 15.0, 11.0, 11.0, 10.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3494338393211365, -0.3361285626888275, -0.32282325625419617, -0.3095179796218872, -0.29621270298957825, -0.2829073965549469, -0.26960211992263794, -0.2562968134880066, -0.24299153685569763, -0.22968624532222748, -0.21638096868991852, -0.20307567715644836, -0.1897703856229782, -0.17646509408950806, -0.1631598174571991, -0.14985452592372894, -0.13654924929141998, -0.12324396520853043, -0.10993867367506027, -0.09663338959217072, -0.08332809805870056, -0.070022813975811, -0.05671752989292145, -0.043412238359451294, -0.030106954276561737, -0.01680166646838188, -0.0034963805228471756, 0.00980890542268753, 0.023114193230867386, 0.03641948103904724, 0.0497247651219368, 0.06303005665540695, 0.07633534073829651, 0.08964062482118607, 0.10294591635465622, 0.11625120043754578, 0.12955649197101593, 0.14286178350448608, 0.15616706013679504, 0.1694723516702652, 0.18277764320373535, 0.1960829347372055, 0.20938821136951447, 0.22269350290298462, 0.23599879443645477, 0.24930408596992493, 0.2626093626022339, 0.27591466903686523, 0.2892199158668518, 0.30252519249916077, 0.3158304989337921, 0.3291357755661011, 0.34244105219841003, 0.3557463586330414, 0.36905163526535034, 0.3823569416999817, 0.39566221833229065, 0.4089674949645996, 0.42227280139923096, 0.4355780780315399, 0.4488833546638489, 0.4621886610984802, 0.4754939377307892, 0.48879921436309814, 0.5021045207977295]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 5.0, 12.0, 16.0, 35.0, 48.0, 88.0, 158.0, 334.0, 584.0, 1163.0, 2463.0, 5847.0, 15189.0, 48055.0, 213310.0, 565713.0, 140299.0, 34796.0, 11593.0, 4702.0, 2144.0, 917.0, 464.0, 237.0, 161.0, 85.0, 46.0, 29.0, 18.0, 17.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8459930419921875, -0.821380615234375, -0.7967681884765625, -0.77215576171875, -0.7475433349609375, -0.722930908203125, -0.6983184814453125, -0.6737060546875, -0.6490936279296875, -0.624481201171875, -0.5998687744140625, -0.57525634765625, -0.5506439208984375, -0.526031494140625, -0.5014190673828125, -0.476806640625, -0.4521942138671875, -0.427581787109375, -0.4029693603515625, -0.37835693359375, -0.3537445068359375, -0.329132080078125, -0.3045196533203125, -0.2799072265625, -0.2552947998046875, -0.230682373046875, -0.2060699462890625, -0.18145751953125, -0.1568450927734375, -0.132232666015625, -0.1076202392578125, -0.0830078125, -0.0583953857421875, -0.033782958984375, -0.0091705322265625, 0.01544189453125, 0.0400543212890625, 0.064666748046875, 0.0892791748046875, 0.1138916015625, 0.1385040283203125, 0.163116455078125, 0.1877288818359375, 0.21234130859375, 0.2369537353515625, 0.261566162109375, 0.2861785888671875, 0.310791015625, 0.3354034423828125, 0.360015869140625, 0.3846282958984375, 0.40924072265625, 0.4338531494140625, 0.458465576171875, 0.4830780029296875, 0.5076904296875, 0.5323028564453125, 0.556915283203125, 0.5815277099609375, 0.60614013671875, 0.6307525634765625, 0.655364990234375, 0.6799774169921875, 0.70458984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 9.0, 1.0, 5.0, 3.0, 10.0, 10.0, 12.0, 26.0, 16.0, 42.0, 32.0, 34.0, 33.0, 42.0, 42.0, 45.0, 60.0, 64.0, 48.0, 54.0, 40.0, 44.0, 42.0, 41.0, 44.0, 37.0, 27.0, 29.0, 23.0, 11.0, 16.0, 12.0, 7.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.5895843505859375, -0.566375732421875, -0.5431671142578125, -0.51995849609375, -0.4967498779296875, -0.473541259765625, -0.4503326416015625, -0.4271240234375, -0.4039154052734375, -0.380706787109375, -0.3574981689453125, -0.33428955078125, -0.3110809326171875, -0.287872314453125, -0.2646636962890625, -0.241455078125, -0.2182464599609375, -0.195037841796875, -0.1718292236328125, -0.14862060546875, -0.1254119873046875, -0.102203369140625, -0.0789947509765625, -0.0557861328125, -0.0325775146484375, -0.009368896484375, 0.0138397216796875, 0.03704833984375, 0.0602569580078125, 0.083465576171875, 0.1066741943359375, 0.1298828125, 0.1530914306640625, 0.176300048828125, 0.1995086669921875, 0.22271728515625, 0.2459259033203125, 0.269134521484375, 0.2923431396484375, 0.3155517578125, 0.3387603759765625, 0.361968994140625, 0.3851776123046875, 0.40838623046875, 0.4315948486328125, 0.454803466796875, 0.4780120849609375, 0.501220703125, 0.5244293212890625, 0.547637939453125, 0.5708465576171875, 0.59405517578125, 0.6172637939453125, 0.640472412109375, 0.6636810302734375, 0.6868896484375, 0.7100982666015625, 0.733306884765625, 0.7565155029296875, 0.77972412109375, 0.8029327392578125, 0.826141357421875, 0.8493499755859375, 0.87255859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 8.0, 18.0, 18.0, 20.0, 21.0, 25.0, 22.0, 29.0, 43.0, 57.0, 67.0, 98.0, 138.0, 220.0, 492.0, 1987.0, 21672.0, 795846.0, 217275.0, 8336.0, 1095.0, 374.0, 162.0, 126.0, 77.0, 64.0, 46.0, 46.0, 25.0, 20.0, 24.0, 19.0, 16.0, 11.0, 11.0, 3.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7639923095703125, -1.702789306640625, -1.6415863037109375, -1.58038330078125, -1.5191802978515625, -1.457977294921875, -1.3967742919921875, -1.3355712890625, -1.2743682861328125, -1.213165283203125, -1.1519622802734375, -1.09075927734375, -1.0295562744140625, -0.968353271484375, -0.9071502685546875, -0.845947265625, -0.7847442626953125, -0.723541259765625, -0.6623382568359375, -0.60113525390625, -0.5399322509765625, -0.478729248046875, -0.4175262451171875, -0.3563232421875, -0.2951202392578125, -0.233917236328125, -0.1727142333984375, -0.11151123046875, -0.0503082275390625, 0.010894775390625, 0.0720977783203125, 0.13330078125, 0.1945037841796875, 0.255706787109375, 0.3169097900390625, 0.37811279296875, 0.4393157958984375, 0.500518798828125, 0.5617218017578125, 0.6229248046875, 0.6841278076171875, 0.745330810546875, 0.8065338134765625, 0.86773681640625, 0.9289398193359375, 0.990142822265625, 1.0513458251953125, 1.112548828125, 1.1737518310546875, 1.234954833984375, 1.2961578369140625, 1.35736083984375, 1.4185638427734375, 1.479766845703125, 1.5409698486328125, 1.6021728515625, 1.6633758544921875, 1.724578857421875, 1.7857818603515625, 1.84698486328125, 1.9081878662109375, 1.969390869140625, 2.0305938720703125, 2.091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 7.0, 19.0, 18.0, 13.0, 22.0, 34.0, 35.0, 34.0, 36.0, 31.0, 42.0, 44.0, 35.0, 40.0, 50.0, 53.0, 39.0, 45.0, 53.0, 43.0, 36.0, 32.0, 33.0, 21.0, 31.0, 17.0, 14.0, 17.0, 15.0, 9.0, 11.0, 13.0, 5.0, 10.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.794921875, -0.7722625732421875, -0.749603271484375, -0.7269439697265625, -0.70428466796875, -0.6816253662109375, -0.658966064453125, -0.6363067626953125, -0.6136474609375, -0.5909881591796875, -0.568328857421875, -0.5456695556640625, -0.52301025390625, -0.5003509521484375, -0.477691650390625, -0.4550323486328125, -0.432373046875, -0.4097137451171875, -0.387054443359375, -0.3643951416015625, -0.34173583984375, -0.3190765380859375, -0.296417236328125, -0.2737579345703125, -0.2510986328125, -0.2284393310546875, -0.205780029296875, -0.1831207275390625, -0.16046142578125, -0.1378021240234375, -0.115142822265625, -0.0924835205078125, -0.06982421875, -0.0471649169921875, -0.024505615234375, -0.0018463134765625, 0.02081298828125, 0.0434722900390625, 0.066131591796875, 0.0887908935546875, 0.1114501953125, 0.1341094970703125, 0.156768798828125, 0.1794281005859375, 0.20208740234375, 0.2247467041015625, 0.247406005859375, 0.2700653076171875, 0.292724609375, 0.3153839111328125, 0.338043212890625, 0.3607025146484375, 0.38336181640625, 0.4060211181640625, 0.428680419921875, 0.4513397216796875, 0.4739990234375, 0.4966583251953125, 0.519317626953125, 0.5419769287109375, 0.56463623046875, 0.5872955322265625, 0.609954833984375, 0.6326141357421875, 0.6552734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 3.0, 13.0, 17.0, 30.0, 46.0, 75.0, 152.0, 356.0, 884.0, 2851.0, 14760.0, 344134.0, 658290.0, 21598.0, 3485.0, 1017.0, 427.0, 163.0, 98.0, 47.0, 31.0, 10.0, 17.0, 9.0, 7.0, 7.0, 5.0, 10.0, 0.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41064453125, -0.39490509033203125, -0.3791656494140625, -0.36342620849609375, -0.347686767578125, -0.33194732666015625, -0.3162078857421875, -0.30046844482421875, -0.28472900390625, -0.26898956298828125, -0.2532501220703125, -0.23751068115234375, -0.221771240234375, -0.20603179931640625, -0.1902923583984375, -0.17455291748046875, -0.1588134765625, -0.14307403564453125, -0.1273345947265625, -0.11159515380859375, -0.095855712890625, -0.08011627197265625, -0.0643768310546875, -0.04863739013671875, -0.03289794921875, -0.01715850830078125, -0.0014190673828125, 0.01432037353515625, 0.030059814453125, 0.04579925537109375, 0.0615386962890625, 0.07727813720703125, 0.093017578125, 0.10875701904296875, 0.1244964599609375, 0.14023590087890625, 0.155975341796875, 0.17171478271484375, 0.1874542236328125, 0.20319366455078125, 0.21893310546875, 0.23467254638671875, 0.2504119873046875, 0.26615142822265625, 0.281890869140625, 0.29763031005859375, 0.3133697509765625, 0.32910919189453125, 0.3448486328125, 0.36058807373046875, 0.3763275146484375, 0.39206695556640625, 0.407806396484375, 0.42354583740234375, 0.4392852783203125, 0.45502471923828125, 0.47076416015625, 0.48650360107421875, 0.5022430419921875, 0.5179824829101562, 0.533721923828125, 0.5494613647460938, 0.5652008056640625, 0.5809402465820312, 0.5966796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 18.0, 10.0, 40.0, 47.0, 76.0, 102.0, 162.0, 157.0, 123.0, 79.0, 45.0, 46.0, 19.0, 14.0, 13.0, 9.0, 6.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.106760025024414e-05, -3.943406045436859e-05, -3.780052065849304e-05, -3.616698086261749e-05, -3.453344106674194e-05, -3.2899901270866394e-05, -3.1266361474990845e-05, -2.9632821679115295e-05, -2.7999281883239746e-05, -2.6365742087364197e-05, -2.4732202291488647e-05, -2.3098662495613098e-05, -2.146512269973755e-05, -1.9831582903862e-05, -1.819804310798645e-05, -1.65645033121109e-05, -1.4930963516235352e-05, -1.3297423720359802e-05, -1.1663883924484253e-05, -1.0030344128608704e-05, -8.396804332733154e-06, -6.763264536857605e-06, -5.129724740982056e-06, -3.4961849451065063e-06, -1.862645149230957e-06, -2.2910535335540771e-07, 1.4044344425201416e-06, 3.037974238395691e-06, 4.67151403427124e-06, 6.3050538301467896e-06, 7.938593626022339e-06, 9.572133421897888e-06, 1.1205673217773438e-05, 1.2839213013648987e-05, 1.4472752809524536e-05, 1.6106292605400085e-05, 1.7739832401275635e-05, 1.9373372197151184e-05, 2.1006911993026733e-05, 2.2640451788902283e-05, 2.4273991584777832e-05, 2.590753138065338e-05, 2.754107117652893e-05, 2.917461097240448e-05, 3.080815076828003e-05, 3.244169056415558e-05, 3.407523036003113e-05, 3.570877015590668e-05, 3.7342309951782227e-05, 3.8975849747657776e-05, 4.0609389543533325e-05, 4.2242929339408875e-05, 4.3876469135284424e-05, 4.551000893115997e-05, 4.714354872703552e-05, 4.877708852291107e-05, 5.041062831878662e-05, 5.204416811466217e-05, 5.367770791053772e-05, 5.531124770641327e-05, 5.694478750228882e-05, 5.857832729816437e-05, 6.021186709403992e-05, 6.184540688991547e-05, 6.347894668579102e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 14.0, 19.0, 43.0, 77.0, 195.0, 602.0, 2852.0, 43139.0, 962127.0, 35944.0, 2577.0, 590.0, 203.0, 82.0, 39.0, 18.0, 12.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8824310302734375, -0.860076904296875, -0.8377227783203125, -0.81536865234375, -0.7930145263671875, -0.770660400390625, -0.7483062744140625, -0.7259521484375, -0.7035980224609375, -0.681243896484375, -0.6588897705078125, -0.63653564453125, -0.6141815185546875, -0.591827392578125, -0.5694732666015625, -0.547119140625, -0.5247650146484375, -0.502410888671875, -0.4800567626953125, -0.45770263671875, -0.4353485107421875, -0.412994384765625, -0.3906402587890625, -0.3682861328125, -0.3459320068359375, -0.323577880859375, -0.3012237548828125, -0.27886962890625, -0.2565155029296875, -0.234161376953125, -0.2118072509765625, -0.189453125, -0.1670989990234375, -0.144744873046875, -0.1223907470703125, -0.10003662109375, -0.0776824951171875, -0.055328369140625, -0.0329742431640625, -0.0106201171875, 0.0117340087890625, 0.034088134765625, 0.0564422607421875, 0.07879638671875, 0.1011505126953125, 0.123504638671875, 0.1458587646484375, 0.168212890625, 0.1905670166015625, 0.212921142578125, 0.2352752685546875, 0.25762939453125, 0.2799835205078125, 0.302337646484375, 0.3246917724609375, 0.3470458984375, 0.3694000244140625, 0.391754150390625, 0.4141082763671875, 0.43646240234375, 0.4588165283203125, 0.481170654296875, 0.5035247802734375, 0.52587890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 9.0, 12.0, 27.0, 52.0, 86.0, 135.0, 207.0, 188.0, 116.0, 68.0, 34.0, 20.0, 12.0, 6.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.119873046875, -0.11352157592773438, -0.10717010498046875, -0.10081863403320312, -0.0944671630859375, -0.08811569213867188, -0.08176422119140625, -0.07541275024414062, -0.069061279296875, -0.06270980834960938, -0.05635833740234375, -0.050006866455078125, -0.0436553955078125, -0.037303924560546875, -0.03095245361328125, -0.024600982666015625, -0.01824951171875, -0.011898040771484375, -0.00554656982421875, 0.000804901123046875, 0.0071563720703125, 0.013507843017578125, 0.01985931396484375, 0.026210784912109375, 0.032562255859375, 0.038913726806640625, 0.04526519775390625, 0.051616668701171875, 0.0579681396484375, 0.06431961059570312, 0.07067108154296875, 0.07702255249023438, 0.0833740234375, 0.08972549438476562, 0.09607696533203125, 0.10242843627929688, 0.1087799072265625, 0.11513137817382812, 0.12148284912109375, 0.12783432006835938, 0.134185791015625, 0.14053726196289062, 0.14688873291015625, 0.15324020385742188, 0.1595916748046875, 0.16594314575195312, 0.17229461669921875, 0.17864608764648438, 0.18499755859375, 0.19134902954101562, 0.19770050048828125, 0.20405197143554688, 0.2104034423828125, 0.21675491333007812, 0.22310638427734375, 0.22945785522460938, 0.235809326171875, 0.24216079711914062, 0.24851226806640625, 0.2548637390136719, 0.2612152099609375, 0.2675666809082031, 0.27391815185546875, 0.2802696228027344, 0.28662109375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 43.0, 98.0, 177.0, 241.0, 222.0, 109.0, 52.0, 30.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3290119171142578, -1.2319542169570923, -1.1348965167999268, -1.0378386974334717, -0.9407809972763062, -0.8437232971191406, -0.7466655373573303, -0.64960777759552, -0.5525500774383545, -0.4554923474788666, -0.35843461751937866, -0.26137688755989075, -0.16431915760040283, -0.06726142764091492, 0.029796302318572998, 0.1268540620803833, 0.22391176223754883, 0.32096949219703674, 0.41802722215652466, 0.515084981918335, 0.6121426820755005, 0.709200382232666, 0.8062581419944763, 0.9033159017562866, 1.0003736019134521, 1.0974313020706177, 1.1944890022277832, 1.2915468215942383, 1.3886045217514038, 1.4856622219085693, 1.5827200412750244, 1.67977774143219, 1.7768354415893555, 1.873893141746521, 1.9709508419036865, 2.0680086612701416, 2.1650662422180176, 2.2621240615844727, 2.3591818809509277, 2.456239700317383, 2.553297281265259, 2.650355100631714, 2.74741268157959, 2.844470500946045, 2.9415283203125, 3.038585901260376, 3.135643720626831, 3.232701301574707, 3.329759120941162, 3.426816940307617, 3.523874521255493, 3.6209323406219482, 3.717989921569824, 3.8150477409362793, 3.9121055603027344, 4.0091633796691895, 4.1062211990356445, 4.2032790184021, 4.300336837768555, 4.397394180297852, 4.494451999664307, 4.591509819030762, 4.688567638397217, 4.785625457763672, 4.882682800292969]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 9.0, 11.0, 18.0, 23.0, 21.0, 28.0, 33.0, 41.0, 45.0, 42.0, 41.0, 43.0, 57.0, 50.0, 50.0, 34.0, 52.0, 50.0, 41.0, 38.0, 43.0, 27.0, 29.0, 25.0, 20.0, 16.0, 20.0, 6.0, 14.0, 14.0, 13.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.309946894645691, -1.2691545486450195, -1.2283622026443481, -1.1875699758529663, -1.146777629852295, -1.1059852838516235, -1.0651929378509521, -1.0244007110595703, -0.9836083650588989, -0.9428160190582275, -0.9020237326622009, -0.8612313866615295, -0.8204391002655029, -0.7796467542648315, -0.7388544082641602, -0.6980621218681335, -0.6572697758674622, -0.6164774298667908, -0.5756851434707642, -0.5348927974700928, -0.49410051107406616, -0.4533081650733948, -0.4125158488750458, -0.3717235326766968, -0.3309312164783478, -0.2901389002799988, -0.24934658408164978, -0.2085542529821396, -0.1677619367837906, -0.1269696205854416, -0.0861772894859314, -0.0453849732875824, -0.0045926570892333984, 0.0361996628344059, 0.0769919827580452, 0.11778430640697479, 0.1585766226053238, 0.1993689388036728, 0.24016126990318298, 0.280953586101532, 0.321745902299881, 0.36253821849823, 0.403330534696579, 0.444122850894928, 0.48491519689559937, 0.525707483291626, 0.5664998292922974, 0.6072921752929688, 0.6480844616889954, 0.6888768076896667, 0.7296690940856934, 0.7704614400863647, 0.8112537264823914, 0.8520460724830627, 0.8928383588790894, 0.9336307048797607, 0.9744230508804321, 1.0152153968811035, 1.056007742881775, 1.0967999696731567, 1.1375923156738281, 1.1783846616744995, 1.219177007675171, 1.2599692344665527, 1.3007615804672241]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 10.0, 7.0, 18.0, 15.0, 22.0, 32.0, 72.0, 108.0, 228.0, 462.0, 1021.0, 3003.0, 13824.0, 145568.0, 2609292.0, 1349423.0, 60258.0, 7634.0, 1918.0, 650.0, 305.0, 182.0, 86.0, 60.0, 21.0, 18.0, 13.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.150390625, -1.1090850830078125, -1.067779541015625, -1.0264739990234375, -0.98516845703125, -0.9438629150390625, -0.902557373046875, -0.8612518310546875, -0.8199462890625, -0.7786407470703125, -0.737335205078125, -0.6960296630859375, -0.65472412109375, -0.6134185791015625, -0.572113037109375, -0.5308074951171875, -0.489501953125, -0.4481964111328125, -0.406890869140625, -0.3655853271484375, -0.32427978515625, -0.2829742431640625, -0.241668701171875, -0.2003631591796875, -0.1590576171875, -0.1177520751953125, -0.076446533203125, -0.0351409912109375, 0.00616455078125, 0.0474700927734375, 0.088775634765625, 0.1300811767578125, 0.17138671875, 0.2126922607421875, 0.253997802734375, 0.2953033447265625, 0.33660888671875, 0.3779144287109375, 0.419219970703125, 0.4605255126953125, 0.5018310546875, 0.5431365966796875, 0.584442138671875, 0.6257476806640625, 0.66705322265625, 0.7083587646484375, 0.749664306640625, 0.7909698486328125, 0.832275390625, 0.8735809326171875, 0.914886474609375, 0.9561920166015625, 0.99749755859375, 1.0388031005859375, 1.080108642578125, 1.1214141845703125, 1.1627197265625, 1.2040252685546875, 1.245330810546875, 1.2866363525390625, 1.32794189453125, 1.3692474365234375, 1.410552978515625, 1.4518585205078125, 1.4931640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 20.0, 16.0, 13.0, 27.0, 30.0, 36.0, 34.0, 42.0, 34.0, 50.0, 52.0, 71.0, 72.0, 44.0, 61.0, 49.0, 56.0, 56.0, 38.0, 28.0, 31.0, 17.0, 15.0, 16.0, 14.0, 11.0, 11.0, 12.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5185165405273438, -0.4984588623046875, -0.47840118408203125, -0.458343505859375, -0.43828582763671875, -0.4182281494140625, -0.39817047119140625, -0.37811279296875, -0.35805511474609375, -0.3379974365234375, -0.31793975830078125, -0.297882080078125, -0.27782440185546875, -0.2577667236328125, -0.23770904541015625, -0.2176513671875, -0.19759368896484375, -0.1775360107421875, -0.15747833251953125, -0.137420654296875, -0.11736297607421875, -0.0973052978515625, -0.07724761962890625, -0.05718994140625, -0.03713226318359375, -0.0170745849609375, 0.00298309326171875, 0.023040771484375, 0.04309844970703125, 0.0631561279296875, 0.08321380615234375, 0.103271484375, 0.12332916259765625, 0.1433868408203125, 0.16344451904296875, 0.183502197265625, 0.20355987548828125, 0.2236175537109375, 0.24367523193359375, 0.26373291015625, 0.28379058837890625, 0.3038482666015625, 0.32390594482421875, 0.343963623046875, 0.36402130126953125, 0.3840789794921875, 0.40413665771484375, 0.4241943359375, 0.44425201416015625, 0.4643096923828125, 0.48436737060546875, 0.504425048828125, 0.5244827270507812, 0.5445404052734375, 0.5645980834960938, 0.58465576171875, 0.6047134399414062, 0.6247711181640625, 0.6448287963867188, 0.664886474609375, 0.6849441528320312, 0.7050018310546875, 0.7250595092773438, 0.7451171875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 10.0, 21.0, 53.0, 99.0, 195.0, 468.0, 2220.0, 41941.0, 4080995.0, 64738.0, 2561.0, 540.0, 219.0, 92.0, 51.0, 36.0, 22.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.99993896484375, -2.9178466796875, -2.83575439453125, -2.753662109375, -2.67156982421875, -2.5894775390625, -2.50738525390625, -2.42529296875, -2.34320068359375, -2.2611083984375, -2.17901611328125, -2.096923828125, -2.01483154296875, -1.9327392578125, -1.85064697265625, -1.7685546875, -1.68646240234375, -1.6043701171875, -1.52227783203125, -1.440185546875, -1.35809326171875, -1.2760009765625, -1.19390869140625, -1.11181640625, -1.02972412109375, -0.9476318359375, -0.86553955078125, -0.783447265625, -0.70135498046875, -0.6192626953125, -0.53717041015625, -0.455078125, -0.37298583984375, -0.2908935546875, -0.20880126953125, -0.126708984375, -0.04461669921875, 0.0374755859375, 0.11956787109375, 0.20166015625, 0.28375244140625, 0.3658447265625, 0.44793701171875, 0.530029296875, 0.61212158203125, 0.6942138671875, 0.77630615234375, 0.8583984375, 0.94049072265625, 1.0225830078125, 1.10467529296875, 1.186767578125, 1.26885986328125, 1.3509521484375, 1.43304443359375, 1.51513671875, 1.59722900390625, 1.6793212890625, 1.76141357421875, 1.843505859375, 1.92559814453125, 2.0076904296875, 2.08978271484375, 2.171875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 7.0, 4.0, 10.0, 28.0, 22.0, 53.0, 63.0, 92.0, 151.0, 270.0, 423.0, 674.0, 745.0, 603.0, 348.0, 216.0, 122.0, 82.0, 45.0, 43.0, 25.0, 9.0, 10.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2802391052246094, -0.27068328857421875, -0.2611274719238281, -0.2515716552734375, -0.24201583862304688, -0.23246002197265625, -0.22290420532226562, -0.213348388671875, -0.20379257202148438, -0.19423675537109375, -0.18468093872070312, -0.1751251220703125, -0.16556930541992188, -0.15601348876953125, -0.14645767211914062, -0.13690185546875, -0.12734603881835938, -0.11779022216796875, -0.10823440551757812, -0.0986785888671875, -0.08912277221679688, -0.07956695556640625, -0.07001113891601562, -0.060455322265625, -0.050899505615234375, -0.04134368896484375, -0.031787872314453125, -0.0222320556640625, -0.012676239013671875, -0.00312042236328125, 0.006435394287109375, 0.0159912109375, 0.025547027587890625, 0.03510284423828125, 0.044658660888671875, 0.0542144775390625, 0.06377029418945312, 0.07332611083984375, 0.08288192749023438, 0.092437744140625, 0.10199356079101562, 0.11154937744140625, 0.12110519409179688, 0.1306610107421875, 0.14021682739257812, 0.14977264404296875, 0.15932846069335938, 0.16888427734375, 0.17844009399414062, 0.18799591064453125, 0.19755172729492188, 0.2071075439453125, 0.21666336059570312, 0.22621917724609375, 0.23577499389648438, 0.245330810546875, 0.2548866271972656, 0.26444244384765625, 0.2739982604980469, 0.2835540771484375, 0.2931098937988281, 0.30266571044921875, 0.3122215270996094, 0.32177734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 26.0, 37.0, 67.0, 77.0, 140.0, 142.0, 116.0, 109.0, 87.0, 72.0, 47.0, 28.0, 12.0, 10.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6545131206512451, -1.6121437549591064, -1.5697743892669678, -1.527405023574829, -1.4850356578826904, -1.4426661729812622, -1.4002968072891235, -1.3579274415969849, -1.3155580759048462, -1.2731887102127075, -1.2308193445205688, -1.1884499788284302, -1.146080493927002, -1.1037111282348633, -1.0613417625427246, -1.018972396850586, -0.9766030311584473, -0.9342336654663086, -0.8918642997741699, -0.8494948744773865, -0.8071255087852478, -0.7647561430931091, -0.7223867177963257, -0.680017352104187, -0.6376479864120483, -0.5952786207199097, -0.552909255027771, -0.5105398297309875, -0.4681704640388489, -0.4258010983467102, -0.38343170285224915, -0.3410623073577881, -0.29869282245635986, -0.2563234567642212, -0.21395406126976013, -0.17158468067646027, -0.1292153000831604, -0.08684591948986053, -0.04447653889656067, -0.0021071434020996094, 0.04026222229003906, 0.08263160288333893, 0.1250009834766388, 0.16737036406993866, 0.20973974466323853, 0.2521091103553772, 0.29447850584983826, 0.3368479013442993, 0.379217267036438, 0.42158663272857666, 0.4639560282230377, 0.5063254237174988, 0.5486947894096375, 0.5910641551017761, 0.6334335803985596, 0.6758029460906982, 0.7181723117828369, 0.7605416774749756, 0.8029110431671143, 0.8452804684638977, 0.8876498341560364, 0.930019199848175, 0.9723886251449585, 1.0147579908370972, 1.0571273565292358]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 3.0, 8.0, 9.0, 9.0, 20.0, 10.0, 24.0, 32.0, 33.0, 34.0, 43.0, 51.0, 45.0, 52.0, 51.0, 37.0, 45.0, 61.0, 46.0, 48.0, 34.0, 48.0, 28.0, 37.0, 30.0, 23.0, 15.0, 26.0, 19.0, 19.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6787095069885254, -0.6585495471954346, -0.638389527797699, -0.6182295680046082, -0.5980696082115173, -0.5779095888137817, -0.5577496290206909, -0.5375896692276001, -0.5174297094345093, -0.49726971983909607, -0.47710976004600525, -0.45694977045059204, -0.4367898106575012, -0.416629821062088, -0.3964698314666748, -0.376309871673584, -0.3561498522758484, -0.3359898626804352, -0.31582990288734436, -0.29566991329193115, -0.27550995349884033, -0.2553499639034271, -0.23518997430801392, -0.2150299996137619, -0.1948700249195099, -0.17471005022525787, -0.15455007553100586, -0.13439008593559265, -0.11423011124134064, -0.09407013654708862, -0.07391015440225601, -0.0537501722574234, -0.03359025716781616, -0.01343027874827385, 0.006729699671268463, 0.026889678090810776, 0.04704965651035309, 0.0672096312046051, 0.08736961334943771, 0.10752959549427032, 0.12768957018852234, 0.14784954488277435, 0.16800951957702637, 0.18816950917243958, 0.2083294838666916, 0.2284894585609436, 0.2486494481563568, 0.26880943775177, 0.28896939754486084, 0.30912938714027405, 0.32928934693336487, 0.3494493365287781, 0.3696092963218689, 0.3897692859172821, 0.4099292755126953, 0.43008923530578613, 0.45024922490119934, 0.47040921449661255, 0.49056917428970337, 0.5107291340827942, 0.5308891534805298, 0.5510491132736206, 0.5712090730667114, 0.591369092464447, 0.6115290522575378]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 7.0, 12.0, 16.0, 19.0, 32.0, 47.0, 84.0, 141.0, 368.0, 783.0, 1810.0, 5224.0, 17306.0, 71349.0, 344864.0, 460338.0, 110064.0, 24613.0, 7204.0, 2453.0, 985.0, 380.0, 183.0, 99.0, 52.0, 32.0, 17.0, 13.0, 10.0, 9.0, 9.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.169769287109375, -0.16351318359375, -0.157257080078125, -0.1510009765625, -0.144744873046875, -0.13848876953125, -0.132232666015625, -0.1259765625, -0.119720458984375, -0.11346435546875, -0.107208251953125, -0.1009521484375, -0.094696044921875, -0.08843994140625, -0.082183837890625, -0.075927734375, -0.069671630859375, -0.06341552734375, -0.057159423828125, -0.0509033203125, -0.044647216796875, -0.03839111328125, -0.032135009765625, -0.02587890625, -0.019622802734375, -0.01336669921875, -0.007110595703125, -0.0008544921875, 0.005401611328125, 0.01165771484375, 0.017913818359375, 0.024169921875, 0.030426025390625, 0.03668212890625, 0.042938232421875, 0.0491943359375, 0.055450439453125, 0.06170654296875, 0.067962646484375, 0.07421875, 0.080474853515625, 0.08673095703125, 0.092987060546875, 0.0992431640625, 0.105499267578125, 0.11175537109375, 0.118011474609375, 0.124267578125, 0.130523681640625, 0.13677978515625, 0.143035888671875, 0.1492919921875, 0.155548095703125, 0.16180419921875, 0.168060302734375, 0.17431640625, 0.180572509765625, 0.18682861328125, 0.193084716796875, 0.1993408203125, 0.205596923828125, 0.21185302734375, 0.218109130859375, 0.224365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 6.0, 5.0, 7.0, 8.0, 9.0, 20.0, 21.0, 27.0, 30.0, 32.0, 32.0, 47.0, 56.0, 56.0, 59.0, 45.0, 61.0, 55.0, 60.0, 41.0, 44.0, 45.0, 35.0, 27.0, 32.0, 30.0, 16.0, 20.0, 18.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.50146484375, -0.4869537353515625, -0.472442626953125, -0.4579315185546875, -0.44342041015625, -0.4289093017578125, -0.414398193359375, -0.3998870849609375, -0.3853759765625, -0.3708648681640625, -0.356353759765625, -0.3418426513671875, -0.32733154296875, -0.3128204345703125, -0.298309326171875, -0.2837982177734375, -0.269287109375, -0.2547760009765625, -0.240264892578125, -0.2257537841796875, -0.21124267578125, -0.1967315673828125, -0.182220458984375, -0.1677093505859375, -0.1531982421875, -0.1386871337890625, -0.124176025390625, -0.1096649169921875, -0.09515380859375, -0.0806427001953125, -0.066131591796875, -0.0516204833984375, -0.037109375, -0.0225982666015625, -0.008087158203125, 0.0064239501953125, 0.02093505859375, 0.0354461669921875, 0.049957275390625, 0.0644683837890625, 0.0789794921875, 0.0934906005859375, 0.108001708984375, 0.1225128173828125, 0.13702392578125, 0.1515350341796875, 0.166046142578125, 0.1805572509765625, 0.195068359375, 0.2095794677734375, 0.224090576171875, 0.2386016845703125, 0.25311279296875, 0.2676239013671875, 0.282135009765625, 0.2966461181640625, 0.3111572265625, 0.3256683349609375, 0.340179443359375, 0.3546905517578125, 0.36920166015625, 0.3837127685546875, 0.398223876953125, 0.4127349853515625, 0.42724609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 16.0, 28.0, 26.0, 34.0, 58.0, 98.0, 163.0, 233.0, 400.0, 715.0, 1184.0, 2348.0, 4990.0, 11864.0, 30611.0, 86475.0, 228827.0, 350043.0, 205630.0, 76733.0, 27539.0, 10845.0, 4670.0, 2147.0, 1138.0, 669.0, 361.0, 270.0, 133.0, 110.0, 57.0, 45.0, 23.0, 16.0, 11.0, 8.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1441650390625, -0.14020919799804688, -0.13625335693359375, -0.13229751586914062, -0.1283416748046875, -0.12438583374023438, -0.12042999267578125, -0.11647415161132812, -0.112518310546875, -0.10856246948242188, -0.10460662841796875, -0.10065078735351562, -0.0966949462890625, -0.09273910522460938, -0.08878326416015625, -0.08482742309570312, -0.08087158203125, -0.07691574096679688, -0.07295989990234375, -0.06900405883789062, -0.0650482177734375, -0.061092376708984375, -0.05713653564453125, -0.053180694580078125, -0.049224853515625, -0.045269012451171875, -0.04131317138671875, -0.037357330322265625, -0.0334014892578125, -0.029445648193359375, -0.02548980712890625, -0.021533966064453125, -0.017578125, -0.013622283935546875, -0.00966644287109375, -0.005710601806640625, -0.0017547607421875, 0.002201080322265625, 0.00615692138671875, 0.010112762451171875, 0.014068603515625, 0.018024444580078125, 0.02198028564453125, 0.025936126708984375, 0.0298919677734375, 0.033847808837890625, 0.03780364990234375, 0.041759490966796875, 0.04571533203125, 0.049671173095703125, 0.05362701416015625, 0.057582855224609375, 0.0615386962890625, 0.06549453735351562, 0.06945037841796875, 0.07340621948242188, 0.077362060546875, 0.08131790161132812, 0.08527374267578125, 0.08922958374023438, 0.0931854248046875, 0.09714126586914062, 0.10109710693359375, 0.10505294799804688, 0.1090087890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 11.0, 10.0, 4.0, 13.0, 20.0, 20.0, 28.0, 22.0, 33.0, 38.0, 51.0, 44.0, 42.0, 41.0, 47.0, 46.0, 66.0, 49.0, 60.0, 54.0, 41.0, 31.0, 35.0, 36.0, 30.0, 27.0, 22.0, 12.0, 14.0, 6.0, 9.0, 9.0, 4.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.681121826171875, -0.65325927734375, -0.625396728515625, -0.5975341796875, -0.569671630859375, -0.54180908203125, -0.513946533203125, -0.486083984375, -0.458221435546875, -0.43035888671875, -0.402496337890625, -0.3746337890625, -0.346771240234375, -0.31890869140625, -0.291046142578125, -0.26318359375, -0.235321044921875, -0.20745849609375, -0.179595947265625, -0.1517333984375, -0.123870849609375, -0.09600830078125, -0.068145751953125, -0.040283203125, -0.012420654296875, 0.01544189453125, 0.043304443359375, 0.0711669921875, 0.099029541015625, 0.12689208984375, 0.154754638671875, 0.1826171875, 0.210479736328125, 0.23834228515625, 0.266204833984375, 0.2940673828125, 0.321929931640625, 0.34979248046875, 0.377655029296875, 0.405517578125, 0.433380126953125, 0.46124267578125, 0.489105224609375, 0.5169677734375, 0.544830322265625, 0.57269287109375, 0.600555419921875, 0.62841796875, 0.656280517578125, 0.68414306640625, 0.712005615234375, 0.7398681640625, 0.767730712890625, 0.79559326171875, 0.823455810546875, 0.851318359375, 0.879180908203125, 0.90704345703125, 0.934906005859375, 0.9627685546875, 0.990631103515625, 1.01849365234375, 1.046356201171875, 1.07421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 14.0, 9.0, 10.0, 25.0, 41.0, 53.0, 102.0, 176.0, 309.0, 642.0, 1189.0, 2715.0, 6290.0, 17421.0, 58963.0, 238408.0, 471000.0, 181741.0, 45613.0, 14021.0, 5189.0, 2342.0, 1074.0, 502.0, 287.0, 163.0, 91.0, 64.0, 32.0, 19.0, 14.0, 12.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05316162109375, -0.05152082443237305, -0.049880027770996094, -0.04823923110961914, -0.04659843444824219, -0.044957637786865234, -0.04331684112548828, -0.04167604446411133, -0.040035247802734375, -0.03839445114135742, -0.03675365447998047, -0.035112857818603516, -0.03347206115722656, -0.03183126449584961, -0.030190467834472656, -0.028549671173095703, -0.02690887451171875, -0.025268077850341797, -0.023627281188964844, -0.02198648452758789, -0.020345687866210938, -0.018704891204833984, -0.01706409454345703, -0.015423297882080078, -0.013782501220703125, -0.012141704559326172, -0.010500907897949219, -0.008860111236572266, -0.0072193145751953125, -0.005578517913818359, -0.003937721252441406, -0.002296924591064453, -0.0006561279296875, 0.0009846687316894531, 0.0026254653930664062, 0.004266262054443359, 0.0059070587158203125, 0.007547855377197266, 0.009188652038574219, 0.010829448699951172, 0.012470245361328125, 0.014111042022705078, 0.01575183868408203, 0.017392635345458984, 0.019033432006835938, 0.02067422866821289, 0.022315025329589844, 0.023955821990966797, 0.02559661865234375, 0.027237415313720703, 0.028878211975097656, 0.03051900863647461, 0.03215980529785156, 0.033800601959228516, 0.03544139862060547, 0.03708219528198242, 0.038722991943359375, 0.04036378860473633, 0.04200458526611328, 0.043645381927490234, 0.04528617858886719, 0.04692697525024414, 0.048567771911621094, 0.05020856857299805, 0.051849365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 3.0, 16.0, 12.0, 24.0, 43.0, 55.0, 77.0, 99.0, 126.0, 134.0, 115.0, 88.0, 58.0, 45.0, 21.0, 17.0, 17.0, 17.0, 7.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.9309652745723724e-05, -2.810172736644745e-05, -2.6893801987171173e-05, -2.5685876607894897e-05, -2.4477951228618622e-05, -2.3270025849342346e-05, -2.206210047006607e-05, -2.0854175090789795e-05, -1.964624971151352e-05, -1.8438324332237244e-05, -1.7230398952960968e-05, -1.6022473573684692e-05, -1.4814548194408417e-05, -1.3606622815132141e-05, -1.2398697435855865e-05, -1.119077205657959e-05, -9.982846677303314e-06, -8.774921298027039e-06, -7.566995918750763e-06, -6.359070539474487e-06, -5.151145160198212e-06, -3.943219780921936e-06, -2.7352944016456604e-06, -1.5273690223693848e-06, -3.1944364309310913e-07, 8.884817361831665e-07, 2.096407115459442e-06, 3.3043324947357178e-06, 4.512257874011993e-06, 5.720183253288269e-06, 6.928108632564545e-06, 8.13603401184082e-06, 9.343959391117096e-06, 1.0551884770393372e-05, 1.1759810149669647e-05, 1.2967735528945923e-05, 1.4175660908222198e-05, 1.5383586287498474e-05, 1.659151166677475e-05, 1.7799437046051025e-05, 1.90073624253273e-05, 2.0215287804603577e-05, 2.1423213183879852e-05, 2.2631138563156128e-05, 2.3839063942432404e-05, 2.504698932170868e-05, 2.6254914700984955e-05, 2.746284008026123e-05, 2.8670765459537506e-05, 2.9878690838813782e-05, 3.108661621809006e-05, 3.229454159736633e-05, 3.350246697664261e-05, 3.4710392355918884e-05, 3.591831773519516e-05, 3.7126243114471436e-05, 3.833416849374771e-05, 3.954209387302399e-05, 4.075001925230026e-05, 4.195794463157654e-05, 4.3165870010852814e-05, 4.437379539012909e-05, 4.5581720769405365e-05, 4.678964614868164e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 17.0, 22.0, 22.0, 36.0, 65.0, 100.0, 180.0, 266.0, 539.0, 1133.0, 2775.0, 7354.0, 22518.0, 83909.0, 295614.0, 414596.0, 158020.0, 41004.0, 12470.0, 4509.0, 1681.0, 759.0, 389.0, 196.0, 124.0, 70.0, 52.0, 31.0, 23.0, 17.0, 13.0, 11.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.049591064453125, -0.048142433166503906, -0.04669380187988281, -0.04524517059326172, -0.043796539306640625, -0.04234790802001953, -0.04089927673339844, -0.039450645446777344, -0.03800201416015625, -0.036553382873535156, -0.03510475158691406, -0.03365612030029297, -0.032207489013671875, -0.03075885772705078, -0.029310226440429688, -0.027861595153808594, -0.0264129638671875, -0.024964332580566406, -0.023515701293945312, -0.02206707000732422, -0.020618438720703125, -0.01916980743408203, -0.017721176147460938, -0.016272544860839844, -0.01482391357421875, -0.013375282287597656, -0.011926651000976562, -0.010478019714355469, -0.009029388427734375, -0.007580757141113281, -0.0061321258544921875, -0.004683494567871094, -0.00323486328125, -0.0017862319946289062, -0.0003376007080078125, 0.0011110305786132812, 0.002559661865234375, 0.004008293151855469, 0.0054569244384765625, 0.006905555725097656, 0.00835418701171875, 0.009802818298339844, 0.011251449584960938, 0.012700080871582031, 0.014148712158203125, 0.015597343444824219, 0.017045974731445312, 0.018494606018066406, 0.0199432373046875, 0.021391868591308594, 0.022840499877929688, 0.02428913116455078, 0.025737762451171875, 0.02718639373779297, 0.028635025024414062, 0.030083656311035156, 0.03153228759765625, 0.032980918884277344, 0.03442955017089844, 0.03587818145751953, 0.037326812744140625, 0.03877544403076172, 0.04022407531738281, 0.041672706604003906, 0.043121337890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 7.0, 10.0, 9.0, 21.0, 19.0, 31.0, 32.0, 37.0, 38.0, 45.0, 55.0, 62.0, 57.0, 64.0, 57.0, 57.0, 38.0, 58.0, 58.0, 28.0, 41.0, 28.0, 24.0, 19.0, 12.0, 12.0, 12.0, 9.0, 9.0, 5.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0112457275390625, -0.010927438735961914, -0.010609149932861328, -0.010290861129760742, -0.009972572326660156, -0.00965428352355957, -0.009335994720458984, -0.009017705917358398, -0.008699417114257812, -0.008381128311157227, -0.00806283950805664, -0.007744550704956055, -0.007426261901855469, -0.007107973098754883, -0.006789684295654297, -0.006471395492553711, -0.006153106689453125, -0.005834817886352539, -0.005516529083251953, -0.005198240280151367, -0.004879951477050781, -0.004561662673950195, -0.004243373870849609, -0.0039250850677490234, -0.0036067962646484375, -0.0032885074615478516, -0.0029702186584472656, -0.0026519298553466797, -0.0023336410522460938, -0.002015352249145508, -0.0016970634460449219, -0.001378774642944336, -0.00106048583984375, -0.0007421970367431641, -0.0004239082336425781, -0.00010561943054199219, 0.00021266937255859375, 0.0005309581756591797, 0.0008492469787597656, 0.0011675357818603516, 0.0014858245849609375, 0.0018041133880615234, 0.0021224021911621094, 0.0024406909942626953, 0.0027589797973632812, 0.003077268600463867, 0.003395557403564453, 0.003713846206665039, 0.004032135009765625, 0.004350423812866211, 0.004668712615966797, 0.004987001419067383, 0.005305290222167969, 0.005623579025268555, 0.005941867828369141, 0.0062601566314697266, 0.0065784454345703125, 0.0068967342376708984, 0.007215023040771484, 0.00753331184387207, 0.007851600646972656, 0.008169889450073242, 0.008488178253173828, 0.008806467056274414, 0.009124755859375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 12.0, 53.0, 245.0, 410.0, 221.0, 51.0, 16.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.242868900299072, -4.16200065612793, -4.081132411956787, -4.000264644622803, -3.91939640045166, -3.8385281562805176, -3.757659912109375, -3.6767919063568115, -3.595923662185669, -3.5150554180145264, -3.434187412261963, -3.3533191680908203, -3.272451162338257, -3.1915829181671143, -3.110714912414551, -3.029846668243408, -2.9489784240722656, -2.868110179901123, -2.7872421741485596, -2.706373929977417, -2.6255059242248535, -2.544637680053711, -2.4637694358825684, -2.382901430130005, -2.3020334243774414, -2.221165180206299, -2.1402971744537354, -2.0594289302825928, -1.9785608053207397, -1.8976926803588867, -1.8168245553970337, -1.7359564304351807, -1.655088186264038, -1.574220061302185, -1.493351936340332, -1.4124836921691895, -1.3316155672073364, -1.2507474422454834, -1.1698793172836304, -1.0890111923217773, -1.0081429481506348, -0.9272748231887817, -0.8464066386222839, -0.7655385136604309, -0.6846703290939331, -0.6038022041320801, -0.522934079170227, -0.44206589460372925, -0.3611977696418762, -0.2803296148777008, -0.19946147501468658, -0.11859333515167236, -0.03772518038749695, 0.04314297437667847, 0.1240110993385315, 0.2048792839050293, 0.2857474088668823, 0.36661556363105774, 0.44748371839523315, 0.5283518433570862, 0.609220027923584, 0.690088152885437, 0.77095627784729, 0.8518244624137878, 0.9326925873756409]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 13.0, 20.0, 32.0, 34.0, 26.0, 40.0, 47.0, 63.0, 54.0, 48.0, 44.0, 59.0, 55.0, 48.0, 58.0, 45.0, 36.0, 30.0, 36.0, 26.0, 22.0, 26.0, 22.0, 17.0, 14.0, 6.0, 8.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.461410790681839, -0.4476940631866455, -0.43397730588912964, -0.42026054859161377, -0.4065438210964203, -0.3928270936012268, -0.37911033630371094, -0.36539357900619507, -0.3516768515110016, -0.3379601240158081, -0.32424336671829224, -0.31052660942077637, -0.2968098819255829, -0.2830931544303894, -0.26937639713287354, -0.25565963983535767, -0.24194291234016418, -0.2282261699438095, -0.21450942754745483, -0.20079268515110016, -0.18707594275474548, -0.1733592003583908, -0.15964245796203613, -0.14592571556568146, -0.13220897316932678, -0.1184922307729721, -0.10477548837661743, -0.09105874598026276, -0.07734200358390808, -0.0636252611875534, -0.04990851879119873, -0.036191776394844055, -0.022475063800811768, -0.008758321404457092, 0.004958420991897583, 0.01867516338825226, 0.032391905784606934, 0.04610864818096161, 0.059825390577316284, 0.07354213297367096, 0.08725887537002563, 0.10097561776638031, 0.11469236016273499, 0.12840910255908966, 0.14212584495544434, 0.155842587351799, 0.1695593297481537, 0.18327607214450836, 0.19699281454086304, 0.2107095569372177, 0.2244262993335724, 0.23814304172992706, 0.25185978412628174, 0.2655765414237976, 0.2792932689189911, 0.29300999641418457, 0.30672675371170044, 0.3204435110092163, 0.3341602385044098, 0.34787696599960327, 0.36159372329711914, 0.375310480594635, 0.3890272080898285, 0.402743935585022, 0.41646069288253784]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 11.0, 9.0, 8.0, 21.0, 31.0, 32.0, 69.0, 226.0, 1107.0, 9429.0, 235972.0, 766225.0, 32117.0, 2619.0, 426.0, 121.0, 46.0, 22.0, 16.0, 4.0, 11.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6484375, -1.6029205322265625, -1.557403564453125, -1.5118865966796875, -1.46636962890625, -1.4208526611328125, -1.375335693359375, -1.3298187255859375, -1.2843017578125, -1.2387847900390625, -1.193267822265625, -1.1477508544921875, -1.10223388671875, -1.0567169189453125, -1.011199951171875, -0.9656829833984375, -0.920166015625, -0.8746490478515625, -0.829132080078125, -0.7836151123046875, -0.73809814453125, -0.6925811767578125, -0.647064208984375, -0.6015472412109375, -0.5560302734375, -0.5105133056640625, -0.464996337890625, -0.4194793701171875, -0.37396240234375, -0.3284454345703125, -0.282928466796875, -0.2374114990234375, -0.19189453125, -0.1463775634765625, -0.100860595703125, -0.0553436279296875, -0.00982666015625, 0.0356903076171875, 0.081207275390625, 0.1267242431640625, 0.1722412109375, 0.2177581787109375, 0.263275146484375, 0.3087921142578125, 0.35430908203125, 0.3998260498046875, 0.445343017578125, 0.4908599853515625, 0.536376953125, 0.5818939208984375, 0.627410888671875, 0.6729278564453125, 0.71844482421875, 0.7639617919921875, 0.809478759765625, 0.8549957275390625, 0.9005126953125, 0.9460296630859375, 0.991546630859375, 1.0370635986328125, 1.08258056640625, 1.1280975341796875, 1.173614501953125, 1.2191314697265625, 1.2646484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 13.0, 19.0, 28.0, 25.0, 43.0, 48.0, 65.0, 72.0, 87.0, 78.0, 80.0, 80.0, 70.0, 62.0, 49.0, 41.0, 26.0, 34.0, 19.0, 18.0, 7.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.796875, -0.7592010498046875, -0.721527099609375, -0.6838531494140625, -0.64617919921875, -0.6085052490234375, -0.570831298828125, -0.5331573486328125, -0.4954833984375, -0.4578094482421875, -0.420135498046875, -0.3824615478515625, -0.34478759765625, -0.3071136474609375, -0.269439697265625, -0.2317657470703125, -0.194091796875, -0.1564178466796875, -0.118743896484375, -0.0810699462890625, -0.04339599609375, -0.0057220458984375, 0.031951904296875, 0.0696258544921875, 0.1072998046875, 0.1449737548828125, 0.182647705078125, 0.2203216552734375, 0.25799560546875, 0.2956695556640625, 0.333343505859375, 0.3710174560546875, 0.40869140625, 0.4463653564453125, 0.484039306640625, 0.5217132568359375, 0.55938720703125, 0.5970611572265625, 0.634735107421875, 0.6724090576171875, 0.7100830078125, 0.7477569580078125, 0.785430908203125, 0.8231048583984375, 0.86077880859375, 0.8984527587890625, 0.936126708984375, 0.9738006591796875, 1.011474609375, 1.0491485595703125, 1.086822509765625, 1.1244964599609375, 1.16217041015625, 1.1998443603515625, 1.237518310546875, 1.2751922607421875, 1.3128662109375, 1.3505401611328125, 1.388214111328125, 1.4258880615234375, 1.46356201171875, 1.5012359619140625, 1.538909912109375, 1.5765838623046875, 1.6142578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 6.0, 8.0, 6.0, 13.0, 13.0, 19.0, 32.0, 36.0, 45.0, 56.0, 72.0, 106.0, 129.0, 191.0, 242.0, 454.0, 1298.0, 7104.0, 123252.0, 838155.0, 69758.0, 5184.0, 1063.0, 389.0, 226.0, 156.0, 115.0, 88.0, 59.0, 54.0, 43.0, 32.0, 32.0, 25.0, 18.0, 25.0, 9.0, 9.0, 6.0, 2.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.068359375, -1.033233642578125, -0.99810791015625, -0.962982177734375, -0.9278564453125, -0.892730712890625, -0.85760498046875, -0.822479248046875, -0.787353515625, -0.752227783203125, -0.71710205078125, -0.681976318359375, -0.6468505859375, -0.611724853515625, -0.57659912109375, -0.541473388671875, -0.50634765625, -0.471221923828125, -0.43609619140625, -0.400970458984375, -0.3658447265625, -0.330718994140625, -0.29559326171875, -0.260467529296875, -0.225341796875, -0.190216064453125, -0.15509033203125, -0.119964599609375, -0.0848388671875, -0.049713134765625, -0.01458740234375, 0.020538330078125, 0.0556640625, 0.090789794921875, 0.12591552734375, 0.161041259765625, 0.1961669921875, 0.231292724609375, 0.26641845703125, 0.301544189453125, 0.336669921875, 0.371795654296875, 0.40692138671875, 0.442047119140625, 0.4771728515625, 0.512298583984375, 0.54742431640625, 0.582550048828125, 0.61767578125, 0.652801513671875, 0.68792724609375, 0.723052978515625, 0.7581787109375, 0.793304443359375, 0.82843017578125, 0.863555908203125, 0.898681640625, 0.933807373046875, 0.96893310546875, 1.004058837890625, 1.0391845703125, 1.074310302734375, 1.10943603515625, 1.144561767578125, 1.1796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 9.0, 17.0, 9.0, 16.0, 14.0, 25.0, 21.0, 22.0, 34.0, 41.0, 42.0, 34.0, 41.0, 50.0, 55.0, 52.0, 32.0, 44.0, 53.0, 36.0, 41.0, 30.0, 38.0, 24.0, 26.0, 33.0, 22.0, 21.0, 21.0, 13.0, 18.0, 10.0, 13.0, 4.0, 10.0, 7.0, 1.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6279296875, -0.605072021484375, -0.58221435546875, -0.559356689453125, -0.5364990234375, -0.513641357421875, -0.49078369140625, -0.467926025390625, -0.445068359375, -0.422210693359375, -0.39935302734375, -0.376495361328125, -0.3536376953125, -0.330780029296875, -0.30792236328125, -0.285064697265625, -0.26220703125, -0.239349365234375, -0.21649169921875, -0.193634033203125, -0.1707763671875, -0.147918701171875, -0.12506103515625, -0.102203369140625, -0.079345703125, -0.056488037109375, -0.03363037109375, -0.010772705078125, 0.0120849609375, 0.034942626953125, 0.05780029296875, 0.080657958984375, 0.103515625, 0.126373291015625, 0.14923095703125, 0.172088623046875, 0.1949462890625, 0.217803955078125, 0.24066162109375, 0.263519287109375, 0.286376953125, 0.309234619140625, 0.33209228515625, 0.354949951171875, 0.3778076171875, 0.400665283203125, 0.42352294921875, 0.446380615234375, 0.46923828125, 0.492095947265625, 0.51495361328125, 0.537811279296875, 0.5606689453125, 0.583526611328125, 0.60638427734375, 0.629241943359375, 0.652099609375, 0.674957275390625, 0.69781494140625, 0.720672607421875, 0.7435302734375, 0.766387939453125, 0.78924560546875, 0.812103271484375, 0.8349609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 7.0, 13.0, 22.0, 25.0, 70.0, 130.0, 324.0, 1009.0, 4993.0, 70778.0, 922826.0, 43090.0, 3884.0, 843.0, 275.0, 116.0, 55.0, 29.0, 20.0, 13.0, 14.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.358062744140625, -0.34210205078125, -0.326141357421875, -0.3101806640625, -0.294219970703125, -0.27825927734375, -0.262298583984375, -0.246337890625, -0.230377197265625, -0.21441650390625, -0.198455810546875, -0.1824951171875, -0.166534423828125, -0.15057373046875, -0.134613037109375, -0.11865234375, -0.102691650390625, -0.08673095703125, -0.070770263671875, -0.0548095703125, -0.038848876953125, -0.02288818359375, -0.006927490234375, 0.009033203125, 0.024993896484375, 0.04095458984375, 0.056915283203125, 0.0728759765625, 0.088836669921875, 0.10479736328125, 0.120758056640625, 0.13671875, 0.152679443359375, 0.16864013671875, 0.184600830078125, 0.2005615234375, 0.216522216796875, 0.23248291015625, 0.248443603515625, 0.264404296875, 0.280364990234375, 0.29632568359375, 0.312286376953125, 0.3282470703125, 0.344207763671875, 0.36016845703125, 0.376129150390625, 0.39208984375, 0.408050537109375, 0.42401123046875, 0.439971923828125, 0.4559326171875, 0.471893310546875, 0.48785400390625, 0.503814697265625, 0.519775390625, 0.535736083984375, 0.55169677734375, 0.567657470703125, 0.5836181640625, 0.599578857421875, 0.61553955078125, 0.631500244140625, 0.6474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 4.0, 2.0, 12.0, 14.0, 23.0, 31.0, 59.0, 66.0, 96.0, 120.0, 110.0, 119.0, 83.0, 81.0, 47.0, 36.0, 22.0, 12.0, 19.0, 12.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.017353057861328e-05, -3.9013102650642395e-05, -3.785267472267151e-05, -3.669224679470062e-05, -3.5531818866729736e-05, -3.437139093875885e-05, -3.3210963010787964e-05, -3.205053508281708e-05, -3.089010715484619e-05, -2.9729679226875305e-05, -2.856925129890442e-05, -2.7408823370933533e-05, -2.6248395442962646e-05, -2.508796751499176e-05, -2.3927539587020874e-05, -2.2767111659049988e-05, -2.16066837310791e-05, -2.0446255803108215e-05, -1.928582787513733e-05, -1.8125399947166443e-05, -1.6964972019195557e-05, -1.580454409122467e-05, -1.4644116163253784e-05, -1.3483688235282898e-05, -1.2323260307312012e-05, -1.1162832379341125e-05, -1.000240445137024e-05, -8.841976523399353e-06, -7.681548595428467e-06, -6.5211206674575806e-06, -5.360692739486694e-06, -4.200264811515808e-06, -3.039836883544922e-06, -1.8794089555740356e-06, -7.189810276031494e-07, 4.414469003677368e-07, 1.601874828338623e-06, 2.7623027563095093e-06, 3.9227306842803955e-06, 5.083158612251282e-06, 6.243586540222168e-06, 7.404014468193054e-06, 8.56444239616394e-06, 9.724870324134827e-06, 1.0885298252105713e-05, 1.2045726180076599e-05, 1.3206154108047485e-05, 1.4366582036018372e-05, 1.5527009963989258e-05, 1.6687437891960144e-05, 1.784786581993103e-05, 1.9008293747901917e-05, 2.0168721675872803e-05, 2.132914960384369e-05, 2.2489577531814575e-05, 2.365000545978546e-05, 2.4810433387756348e-05, 2.5970861315727234e-05, 2.713128924369812e-05, 2.8291717171669006e-05, 2.9452145099639893e-05, 3.061257302761078e-05, 3.1773000955581665e-05, 3.293342888355255e-05, 3.409385681152344e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 11.0, 17.0, 22.0, 28.0, 59.0, 96.0, 182.0, 450.0, 1599.0, 9436.0, 234707.0, 775117.0, 22754.0, 2836.0, 682.0, 255.0, 115.0, 62.0, 36.0, 31.0, 14.0, 7.0, 7.0, 4.0, 3.0, 8.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46630859375, -0.45085906982421875, -0.4354095458984375, -0.41996002197265625, -0.404510498046875, -0.38906097412109375, -0.3736114501953125, -0.35816192626953125, -0.34271240234375, -0.32726287841796875, -0.3118133544921875, -0.29636383056640625, -0.280914306640625, -0.26546478271484375, -0.2500152587890625, -0.23456573486328125, -0.2191162109375, -0.20366668701171875, -0.1882171630859375, -0.17276763916015625, -0.157318115234375, -0.14186859130859375, -0.1264190673828125, -0.11096954345703125, -0.09552001953125, -0.08007049560546875, -0.0646209716796875, -0.04917144775390625, -0.033721923828125, -0.01827239990234375, -0.0028228759765625, 0.01262664794921875, 0.028076171875, 0.04352569580078125, 0.0589752197265625, 0.07442474365234375, 0.089874267578125, 0.10532379150390625, 0.1207733154296875, 0.13622283935546875, 0.15167236328125, 0.16712188720703125, 0.1825714111328125, 0.19802093505859375, 0.213470458984375, 0.22891998291015625, 0.2443695068359375, 0.25981903076171875, 0.2752685546875, 0.29071807861328125, 0.3061676025390625, 0.32161712646484375, 0.337066650390625, 0.35251617431640625, 0.3679656982421875, 0.38341522216796875, 0.39886474609375, 0.41431427001953125, 0.4297637939453125, 0.44521331787109375, 0.460662841796875, 0.47611236572265625, 0.4915618896484375, 0.5070114135742188, 0.5224609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 15.0, 12.0, 21.0, 49.0, 51.0, 63.0, 91.0, 113.0, 134.0, 112.0, 90.0, 62.0, 56.0, 27.0, 24.0, 20.0, 13.0, 5.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11870670318603516, -0.11503791809082031, -0.11136913299560547, -0.10770034790039062, -0.10403156280517578, -0.10036277770996094, -0.0966939926147461, -0.09302520751953125, -0.0893564224243164, -0.08568763732910156, -0.08201885223388672, -0.07835006713867188, -0.07468128204345703, -0.07101249694824219, -0.06734371185302734, -0.0636749267578125, -0.060006141662597656, -0.05633735656738281, -0.05266857147216797, -0.048999786376953125, -0.04533100128173828, -0.04166221618652344, -0.037993431091308594, -0.03432464599609375, -0.030655860900878906, -0.026987075805664062, -0.02331829071044922, -0.019649505615234375, -0.01598072052001953, -0.012311935424804688, -0.008643150329589844, -0.004974365234375, -0.0013055801391601562, 0.0023632049560546875, 0.006031990051269531, 0.009700775146484375, 0.013369560241699219, 0.017038345336914062, 0.020707130432128906, 0.02437591552734375, 0.028044700622558594, 0.03171348571777344, 0.03538227081298828, 0.039051055908203125, 0.04271984100341797, 0.04638862609863281, 0.050057411193847656, 0.0537261962890625, 0.057394981384277344, 0.06106376647949219, 0.06473255157470703, 0.06840133666992188, 0.07207012176513672, 0.07573890686035156, 0.0794076919555664, 0.08307647705078125, 0.0867452621459961, 0.09041404724121094, 0.09408283233642578, 0.09775161743164062, 0.10142040252685547, 0.10508918762207031, 0.10875797271728516, 0.1124267578125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 15.0, 44.0, 114.0, 256.0, 293.0, 176.0, 69.0, 25.0, 11.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1168487071990967, -2.006702184677124, -1.8965555429458618, -1.7864090204238892, -1.676262378692627, -1.5661158561706543, -1.4559693336486816, -1.345822811126709, -1.2356761693954468, -1.1255296468734741, -1.015383005142212, -0.9052364826202393, -0.7950899004936218, -0.6849433183670044, -0.5747967958450317, -0.4646502137184143, -0.3545036315917969, -0.24435706436634064, -0.1342104971408844, -0.024063944816589355, 0.08608263731002808, 0.1962292194366455, 0.30637574195861816, 0.4165223240852356, 0.526668906211853, 0.6368154883384705, 0.7469620704650879, 0.8571085929870605, 0.967255175113678, 1.0774017572402954, 1.187548279762268, 1.2976949214935303, 1.407841682434082, 1.5179882049560547, 1.628134846687317, 1.7382813692092896, 1.8484280109405518, 1.9585745334625244, 2.068721055984497, 2.1788675785064697, 2.2890143394470215, 2.399160861968994, 2.509307384490967, 2.6194539070129395, 2.729600667953491, 2.839747190475464, 2.9498937129974365, 3.060040235519409, 3.170186758041382, 3.2803332805633545, 3.390479803085327, 3.500626564025879, 3.6107730865478516, 3.720919609069824, 3.831066131591797, 3.9412126541137695, 4.051359176635742, 4.161505699157715, 4.2716522216796875, 4.38179874420166, 4.491945266723633, 4.6020917892456055, 4.712238311767578, 4.822385311126709, 4.932531833648682]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 8.0, 4.0, 10.0, 7.0, 7.0, 17.0, 24.0, 16.0, 20.0, 28.0, 38.0, 38.0, 33.0, 41.0, 45.0, 41.0, 53.0, 54.0, 44.0, 55.0, 47.0, 47.0, 41.0, 30.0, 35.0, 37.0, 26.0, 25.0, 24.0, 14.0, 15.0, 12.0, 13.0, 10.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.356858491897583, -1.3146865367889404, -1.2725145816802979, -1.2303426265716553, -1.1881706714630127, -1.1459985971450806, -1.103826642036438, -1.0616546869277954, -1.0194827318191528, -0.9773107767105103, -0.9351388216018677, -0.8929668068885803, -0.8507948517799377, -0.8086228966712952, -0.7664508819580078, -0.7242789268493652, -0.6821069717407227, -0.6399350166320801, -0.5977630615234375, -0.5555910468101501, -0.5134190917015076, -0.471247136592865, -0.4290751516819, -0.38690316677093506, -0.3447312116622925, -0.3025592565536499, -0.26038727164268494, -0.21821530163288116, -0.1760433316230774, -0.13387136161327362, -0.09169939160346985, -0.04952740669250488, -0.007355451583862305, 0.03481651842594147, 0.07698848843574524, 0.11916045844554901, 0.16133242845535278, 0.20350439846515656, 0.24567636847496033, 0.2878483533859253, 0.33002030849456787, 0.37219226360321045, 0.4143642485141754, 0.4565362334251404, 0.49870818853378296, 0.5408801436424255, 0.5830521583557129, 0.6252241134643555, 0.667396068572998, 0.7095680236816406, 0.7517399787902832, 0.7939119935035706, 0.8360839486122131, 0.8782559037208557, 0.9204279184341431, 0.9625998735427856, 1.0047718286514282, 1.0469437837600708, 1.0891157388687134, 1.131287693977356, 1.173459768295288, 1.2156317234039307, 1.2578036785125732, 1.2999756336212158, 1.3421475887298584]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 7.0, 6.0, 7.0, 16.0, 20.0, 28.0, 40.0, 62.0, 91.0, 152.0, 315.0, 727.0, 1863.0, 8247.0, 159653.0, 3612587.0, 394327.0, 12885.0, 2035.0, 641.0, 249.0, 121.0, 70.0, 49.0, 28.0, 22.0, 8.0, 10.0, 8.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.900390625, -1.851165771484375, -1.80194091796875, -1.752716064453125, -1.7034912109375, -1.654266357421875, -1.60504150390625, -1.555816650390625, -1.506591796875, -1.457366943359375, -1.40814208984375, -1.358917236328125, -1.3096923828125, -1.260467529296875, -1.21124267578125, -1.162017822265625, -1.11279296875, -1.063568115234375, -1.01434326171875, -0.965118408203125, -0.9158935546875, -0.866668701171875, -0.81744384765625, -0.768218994140625, -0.718994140625, -0.669769287109375, -0.62054443359375, -0.571319580078125, -0.5220947265625, -0.472869873046875, -0.42364501953125, -0.374420166015625, -0.3251953125, -0.275970458984375, -0.22674560546875, -0.177520751953125, -0.1282958984375, -0.079071044921875, -0.02984619140625, 0.019378662109375, 0.068603515625, 0.117828369140625, 0.16705322265625, 0.216278076171875, 0.2655029296875, 0.314727783203125, 0.36395263671875, 0.413177490234375, 0.46240234375, 0.511627197265625, 0.56085205078125, 0.610076904296875, 0.6593017578125, 0.708526611328125, 0.75775146484375, 0.806976318359375, 0.856201171875, 0.905426025390625, 0.95465087890625, 1.003875732421875, 1.0531005859375, 1.102325439453125, 1.15155029296875, 1.200775146484375, 1.25]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 14.0, 16.0, 17.0, 36.0, 36.0, 48.0, 56.0, 76.0, 72.0, 76.0, 77.0, 80.0, 57.0, 57.0, 50.0, 58.0, 36.0, 32.0, 19.0, 19.0, 17.0, 13.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.57781982421875, -0.5521240234375, -0.52642822265625, -0.500732421875, -0.47503662109375, -0.4493408203125, -0.42364501953125, -0.39794921875, -0.37225341796875, -0.3465576171875, -0.32086181640625, -0.295166015625, -0.26947021484375, -0.2437744140625, -0.21807861328125, -0.1923828125, -0.16668701171875, -0.1409912109375, -0.11529541015625, -0.089599609375, -0.06390380859375, -0.0382080078125, -0.01251220703125, 0.01318359375, 0.03887939453125, 0.0645751953125, 0.09027099609375, 0.115966796875, 0.14166259765625, 0.1673583984375, 0.19305419921875, 0.21875, 0.24444580078125, 0.2701416015625, 0.29583740234375, 0.321533203125, 0.34722900390625, 0.3729248046875, 0.39862060546875, 0.42431640625, 0.45001220703125, 0.4757080078125, 0.50140380859375, 0.527099609375, 0.55279541015625, 0.5784912109375, 0.60418701171875, 0.6298828125, 0.65557861328125, 0.6812744140625, 0.70697021484375, 0.732666015625, 0.75836181640625, 0.7840576171875, 0.80975341796875, 0.83544921875, 0.86114501953125, 0.8868408203125, 0.91253662109375, 0.938232421875, 0.96392822265625, 0.9896240234375, 1.01531982421875, 1.041015625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 18.0, 20.0, 44.0, 97.0, 179.0, 500.0, 1722.0, 11692.0, 1633841.0, 2529406.0, 13904.0, 1873.0, 553.0, 203.0, 99.0, 40.0, 26.0, 22.0, 13.0, 4.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.588287353515625, -2.52813720703125, -2.467987060546875, -2.4078369140625, -2.347686767578125, -2.28753662109375, -2.227386474609375, -2.167236328125, -2.107086181640625, -2.04693603515625, -1.986785888671875, -1.9266357421875, -1.866485595703125, -1.80633544921875, -1.746185302734375, -1.68603515625, -1.625885009765625, -1.56573486328125, -1.505584716796875, -1.4454345703125, -1.385284423828125, -1.32513427734375, -1.264984130859375, -1.204833984375, -1.144683837890625, -1.08453369140625, -1.024383544921875, -0.9642333984375, -0.904083251953125, -0.84393310546875, -0.783782958984375, -0.7236328125, -0.663482666015625, -0.60333251953125, -0.543182373046875, -0.4830322265625, -0.422882080078125, -0.36273193359375, -0.302581787109375, -0.242431640625, -0.182281494140625, -0.12213134765625, -0.061981201171875, -0.0018310546875, 0.058319091796875, 0.11846923828125, 0.178619384765625, 0.23876953125, 0.298919677734375, 0.35906982421875, 0.419219970703125, 0.4793701171875, 0.539520263671875, 0.59967041015625, 0.659820556640625, 0.719970703125, 0.780120849609375, 0.84027099609375, 0.900421142578125, 0.9605712890625, 1.020721435546875, 1.08087158203125, 1.141021728515625, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 14.0, 10.0, 14.0, 15.0, 23.0, 39.0, 57.0, 88.0, 102.0, 171.0, 294.0, 442.0, 656.0, 683.0, 509.0, 357.0, 219.0, 122.0, 77.0, 58.0, 38.0, 22.0, 17.0, 15.0, 12.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.22607421875, -0.21882057189941406, -0.21156692504882812, -0.2043132781982422, -0.19705963134765625, -0.1898059844970703, -0.18255233764648438, -0.17529869079589844, -0.1680450439453125, -0.16079139709472656, -0.15353775024414062, -0.1462841033935547, -0.13903045654296875, -0.1317768096923828, -0.12452316284179688, -0.11726951599121094, -0.110015869140625, -0.10276222229003906, -0.09550857543945312, -0.08825492858886719, -0.08100128173828125, -0.07374763488769531, -0.06649398803710938, -0.05924034118652344, -0.0519866943359375, -0.04473304748535156, -0.037479400634765625, -0.030225753784179688, -0.02297210693359375, -0.015718460083007812, -0.008464813232421875, -0.0012111663818359375, 0.00604248046875, 0.013296127319335938, 0.020549774169921875, 0.027803421020507812, 0.03505706787109375, 0.04231071472167969, 0.049564361572265625, 0.05681800842285156, 0.0640716552734375, 0.07132530212402344, 0.07857894897460938, 0.08583259582519531, 0.09308624267578125, 0.10033988952636719, 0.10759353637695312, 0.11484718322753906, 0.122100830078125, 0.12935447692871094, 0.13660812377929688, 0.1438617706298828, 0.15111541748046875, 0.1583690643310547, 0.16562271118164062, 0.17287635803222656, 0.1801300048828125, 0.18738365173339844, 0.19463729858398438, 0.2018909454345703, 0.20914459228515625, 0.2163982391357422, 0.22365188598632812, 0.23090553283691406, 0.2381591796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 30.0, 40.0, 72.0, 143.0, 198.0, 222.0, 151.0, 66.0, 42.0, 25.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8788716793060303, -2.8188812732696533, -2.7588911056518555, -2.6989006996154785, -2.6389105319976807, -2.5789201259613037, -2.518929958343506, -2.458939552307129, -2.398949384689331, -2.338958978652954, -2.2789688110351562, -2.2189784049987793, -2.1589882373809814, -2.0989978313446045, -2.0390076637268066, -1.9790172576904297, -1.9190269708633423, -1.8590366840362549, -1.7990463972091675, -1.73905611038208, -1.6790658235549927, -1.6190755367279053, -1.5590851306915283, -1.4990949630737305, -1.4391045570373535, -1.3791142702102661, -1.3191239833831787, -1.2591336965560913, -1.199143409729004, -1.1391531229019165, -1.079162836074829, -1.0191724300384521, -0.9591822028160095, -0.8991919159889221, -0.8392016291618347, -0.7792112827301025, -0.7192209959030151, -0.6592307090759277, -0.5992404222488403, -0.5392501354217529, -0.4792598485946655, -0.4192695617675781, -0.3592792749404907, -0.29928895831108093, -0.23929867148399353, -0.17930838465690613, -0.11931806802749634, -0.059327781200408936, 0.0006625056266784668, 0.060652799904346466, 0.12064309418201447, 0.18063339591026306, 0.24062368273735046, 0.30061396956443787, 0.36060428619384766, 0.42059457302093506, 0.48058485984802246, 0.5405751466751099, 0.6005654335021973, 0.6605557203292847, 0.7205460071563721, 0.7805362939834595, 0.8405266404151917, 0.900516927242279, 0.9605072140693665]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 11.0, 19.0, 26.0, 24.0, 22.0, 25.0, 47.0, 41.0, 40.0, 48.0, 52.0, 54.0, 46.0, 49.0, 59.0, 47.0, 49.0, 46.0, 38.0, 35.0, 38.0, 27.0, 24.0, 20.0, 18.0, 13.0, 12.0, 9.0, 9.0, 2.0, 2.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6236315369606018, -0.6038021445274353, -0.5839727520942688, -0.5641433596611023, -0.5443139672279358, -0.5244845747947693, -0.5046551823616028, -0.48482581973075867, -0.46499642729759216, -0.44516703486442566, -0.42533764243125916, -0.40550824999809265, -0.38567888736724854, -0.36584949493408203, -0.3460201025009155, -0.326190710067749, -0.3063613176345825, -0.286531925201416, -0.2667025327682495, -0.2468731552362442, -0.2270437628030777, -0.2072143703699112, -0.18738499283790588, -0.16755560040473938, -0.14772620797157288, -0.12789681553840637, -0.10806743055582047, -0.08823804557323456, -0.06840865314006805, -0.04857926070690155, -0.028749875724315643, -0.008920490741729736, 0.010908961296081543, 0.03073835000395775, 0.050567738711833954, 0.07039712369441986, 0.09022651612758636, 0.11005590856075287, 0.12988528609275818, 0.14971467852592468, 0.1695440709590912, 0.1893734633922577, 0.2092028558254242, 0.2290322333574295, 0.248861625790596, 0.2686910033226013, 0.2885203957557678, 0.3083497881889343, 0.32817918062210083, 0.34800857305526733, 0.36783796548843384, 0.38766735792160034, 0.40749675035476685, 0.42732614278793335, 0.44715550541877747, 0.46698489785194397, 0.4868142902851105, 0.5066436529159546, 0.5264730453491211, 0.5463024377822876, 0.5661318302154541, 0.5859612226486206, 0.6057906150817871, 0.6256200075149536, 0.6454493999481201]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 15.0, 15.0, 39.0, 77.0, 229.0, 511.0, 1365.0, 3847.0, 14853.0, 138325.0, 762772.0, 107699.0, 13169.0, 3612.0, 1214.0, 426.0, 193.0, 72.0, 30.0, 20.0, 14.0, 5.0, 9.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.33837890625, -0.3279533386230469, -0.31752777099609375, -0.3071022033691406, -0.2966766357421875, -0.2862510681152344, -0.27582550048828125, -0.2653999328613281, -0.254974365234375, -0.24454879760742188, -0.23412322998046875, -0.22369766235351562, -0.2132720947265625, -0.20284652709960938, -0.19242095947265625, -0.18199539184570312, -0.17156982421875, -0.16114425659179688, -0.15071868896484375, -0.14029312133789062, -0.1298675537109375, -0.11944198608398438, -0.10901641845703125, -0.09859085083007812, -0.088165283203125, -0.07773971557617188, -0.06731414794921875, -0.056888580322265625, -0.0464630126953125, -0.036037445068359375, -0.02561187744140625, -0.015186309814453125, -0.0047607421875, 0.005664825439453125, 0.01609039306640625, 0.026515960693359375, 0.0369415283203125, 0.047367095947265625, 0.05779266357421875, 0.06821823120117188, 0.078643798828125, 0.08906936645507812, 0.09949493408203125, 0.10992050170898438, 0.1203460693359375, 0.13077163696289062, 0.14119720458984375, 0.15162277221679688, 0.16204833984375, 0.17247390747070312, 0.18289947509765625, 0.19332504272460938, 0.2037506103515625, 0.21417617797851562, 0.22460174560546875, 0.23502731323242188, 0.245452880859375, 0.2558784484863281, 0.26630401611328125, 0.2767295837402344, 0.2871551513671875, 0.2975807189941406, 0.30800628662109375, 0.3184318542480469, 0.328857421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 1.0, 4.0, 9.0, 7.0, 7.0, 14.0, 18.0, 15.0, 24.0, 22.0, 26.0, 35.0, 44.0, 46.0, 40.0, 46.0, 50.0, 46.0, 60.0, 53.0, 56.0, 53.0, 50.0, 41.0, 39.0, 30.0, 33.0, 25.0, 16.0, 21.0, 14.0, 8.0, 8.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.406402587890625, -0.39263916015625, -0.378875732421875, -0.3651123046875, -0.351348876953125, -0.33758544921875, -0.323822021484375, -0.31005859375, -0.296295166015625, -0.28253173828125, -0.268768310546875, -0.2550048828125, -0.241241455078125, -0.22747802734375, -0.213714599609375, -0.199951171875, -0.186187744140625, -0.17242431640625, -0.158660888671875, -0.1448974609375, -0.131134033203125, -0.11737060546875, -0.103607177734375, -0.08984375, -0.076080322265625, -0.06231689453125, -0.048553466796875, -0.0347900390625, -0.021026611328125, -0.00726318359375, 0.006500244140625, 0.020263671875, 0.034027099609375, 0.04779052734375, 0.061553955078125, 0.0753173828125, 0.089080810546875, 0.10284423828125, 0.116607666015625, 0.13037109375, 0.144134521484375, 0.15789794921875, 0.171661376953125, 0.1854248046875, 0.199188232421875, 0.21295166015625, 0.226715087890625, 0.240478515625, 0.254241943359375, 0.26800537109375, 0.281768798828125, 0.2955322265625, 0.309295654296875, 0.32305908203125, 0.336822509765625, 0.3505859375, 0.364349365234375, 0.37811279296875, 0.391876220703125, 0.4056396484375, 0.419403076171875, 0.43316650390625, 0.446929931640625, 0.460693359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 4.0, 11.0, 11.0, 13.0, 16.0, 22.0, 40.0, 34.0, 67.0, 93.0, 141.0, 174.0, 261.0, 383.0, 566.0, 935.0, 1511.0, 2565.0, 4546.0, 9082.0, 21226.0, 59936.0, 180448.0, 359296.0, 257055.0, 92497.0, 31163.0, 12191.0, 5821.0, 3139.0, 1842.0, 1175.0, 752.0, 492.0, 321.0, 191.0, 138.0, 95.0, 86.0, 52.0, 34.0, 21.0, 24.0, 16.0, 9.0, 13.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.11712646484375, -0.11354351043701172, -0.10996055603027344, -0.10637760162353516, -0.10279464721679688, -0.0992116928100586, -0.09562873840332031, -0.09204578399658203, -0.08846282958984375, -0.08487987518310547, -0.08129692077636719, -0.0777139663696289, -0.07413101196289062, -0.07054805755615234, -0.06696510314941406, -0.06338214874267578, -0.0597991943359375, -0.05621623992919922, -0.05263328552246094, -0.049050331115722656, -0.045467376708984375, -0.041884422302246094, -0.03830146789550781, -0.03471851348876953, -0.03113555908203125, -0.02755260467529297, -0.023969650268554688, -0.020386695861816406, -0.016803741455078125, -0.013220787048339844, -0.009637832641601562, -0.006054878234863281, -0.002471923828125, 0.0011110305786132812, 0.0046939849853515625, 0.008276939392089844, 0.011859893798828125, 0.015442848205566406, 0.019025802612304688, 0.02260875701904297, 0.02619171142578125, 0.02977466583251953, 0.03335762023925781, 0.036940574645996094, 0.040523529052734375, 0.044106483459472656, 0.04768943786621094, 0.05127239227294922, 0.0548553466796875, 0.05843830108642578, 0.06202125549316406, 0.06560420989990234, 0.06918716430664062, 0.0727701187133789, 0.07635307312011719, 0.07993602752685547, 0.08351898193359375, 0.08710193634033203, 0.09068489074707031, 0.0942678451538086, 0.09785079956054688, 0.10143375396728516, 0.10501670837402344, 0.10859966278076172, 0.1121826171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 7.0, 4.0, 3.0, 9.0, 10.0, 14.0, 19.0, 15.0, 8.0, 15.0, 19.0, 26.0, 36.0, 23.0, 33.0, 32.0, 36.0, 53.0, 43.0, 47.0, 38.0, 50.0, 47.0, 50.0, 49.0, 36.0, 36.0, 31.0, 25.0, 40.0, 21.0, 17.0, 20.0, 13.0, 14.0, 8.0, 3.0, 14.0, 5.0, 6.0, 7.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.728515625, -0.7064666748046875, -0.684417724609375, -0.6623687744140625, -0.64031982421875, -0.6182708740234375, -0.596221923828125, -0.5741729736328125, -0.5521240234375, -0.5300750732421875, -0.508026123046875, -0.4859771728515625, -0.46392822265625, -0.4418792724609375, -0.419830322265625, -0.3977813720703125, -0.375732421875, -0.3536834716796875, -0.331634521484375, -0.3095855712890625, -0.28753662109375, -0.2654876708984375, -0.243438720703125, -0.2213897705078125, -0.1993408203125, -0.1772918701171875, -0.155242919921875, -0.1331939697265625, -0.11114501953125, -0.0890960693359375, -0.067047119140625, -0.0449981689453125, -0.02294921875, -0.0009002685546875, 0.021148681640625, 0.0431976318359375, 0.06524658203125, 0.0872955322265625, 0.109344482421875, 0.1313934326171875, 0.1534423828125, 0.1754913330078125, 0.197540283203125, 0.2195892333984375, 0.24163818359375, 0.2636871337890625, 0.285736083984375, 0.3077850341796875, 0.329833984375, 0.3518829345703125, 0.373931884765625, 0.3959808349609375, 0.41802978515625, 0.4400787353515625, 0.462127685546875, 0.4841766357421875, 0.5062255859375, 0.5282745361328125, 0.550323486328125, 0.5723724365234375, 0.59442138671875, 0.6164703369140625, 0.638519287109375, 0.6605682373046875, 0.6826171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 16.0, 21.0, 37.0, 45.0, 95.0, 162.0, 241.0, 496.0, 849.0, 1796.0, 4156.0, 10679.0, 35453.0, 163746.0, 504383.0, 249867.0, 52398.0, 14398.0, 5289.0, 2146.0, 1067.0, 500.0, 291.0, 137.0, 96.0, 81.0, 36.0, 25.0, 13.0, 8.0, 9.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057281494140625, -0.05562782287597656, -0.053974151611328125, -0.05232048034667969, -0.05066680908203125, -0.04901313781738281, -0.047359466552734375, -0.04570579528808594, -0.0440521240234375, -0.04239845275878906, -0.040744781494140625, -0.03909111022949219, -0.03743743896484375, -0.03578376770019531, -0.034130096435546875, -0.03247642517089844, -0.03082275390625, -0.029169082641601562, -0.027515411376953125, -0.025861740112304688, -0.02420806884765625, -0.022554397583007812, -0.020900726318359375, -0.019247055053710938, -0.0175933837890625, -0.015939712524414062, -0.014286041259765625, -0.012632369995117188, -0.01097869873046875, -0.009325027465820312, -0.007671356201171875, -0.0060176849365234375, -0.004364013671875, -0.0027103424072265625, -0.001056671142578125, 0.0005970001220703125, 0.00225067138671875, 0.0039043426513671875, 0.005558013916015625, 0.0072116851806640625, 0.0088653564453125, 0.010519027709960938, 0.012172698974609375, 0.013826370239257812, 0.01548004150390625, 0.017133712768554688, 0.018787384033203125, 0.020441055297851562, 0.0220947265625, 0.023748397827148438, 0.025402069091796875, 0.027055740356445312, 0.02870941162109375, 0.030363082885742188, 0.032016754150390625, 0.03367042541503906, 0.0353240966796875, 0.03697776794433594, 0.038631439208984375, 0.04028511047363281, 0.04193878173828125, 0.04359245300292969, 0.045246124267578125, 0.04689979553222656, 0.048553466796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 19.0, 36.0, 119.0, 186.0, 256.0, 174.0, 95.0, 59.0, 14.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.82012939453125e-05, -7.626786828041077e-05, -7.433444261550903e-05, -7.24010169506073e-05, -7.046759128570557e-05, -6.853416562080383e-05, -6.66007399559021e-05, -6.466731429100037e-05, -6.273388862609863e-05, -6.08004629611969e-05, -5.8867037296295166e-05, -5.693361163139343e-05, -5.50001859664917e-05, -5.3066760301589966e-05, -5.113333463668823e-05, -4.91999089717865e-05, -4.7266483306884766e-05, -4.533305764198303e-05, -4.33996319770813e-05, -4.1466206312179565e-05, -3.953278064727783e-05, -3.75993549823761e-05, -3.5665929317474365e-05, -3.373250365257263e-05, -3.17990779876709e-05, -2.9865652322769165e-05, -2.793222665786743e-05, -2.5998800992965698e-05, -2.4065375328063965e-05, -2.213194966316223e-05, -2.0198523998260498e-05, -1.8265098333358765e-05, -1.633167266845703e-05, -1.4398247003555298e-05, -1.2464821338653564e-05, -1.0531395673751831e-05, -8.597970008850098e-06, -6.664544343948364e-06, -4.731118679046631e-06, -2.7976930141448975e-06, -8.642673492431641e-07, 1.0691583156585693e-06, 3.0025839805603027e-06, 4.936009645462036e-06, 6.8694353103637695e-06, 8.802860975265503e-06, 1.0736286640167236e-05, 1.266971230506897e-05, 1.4603137969970703e-05, 1.6536563634872437e-05, 1.846998929977417e-05, 2.0403414964675903e-05, 2.2336840629577637e-05, 2.427026629447937e-05, 2.6203691959381104e-05, 2.8137117624282837e-05, 3.007054328918457e-05, 3.2003968954086304e-05, 3.393739461898804e-05, 3.587082028388977e-05, 3.7804245948791504e-05, 3.973767161369324e-05, 4.167109727859497e-05, 4.3604522943496704e-05, 4.553794860839844e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 6.0, 2.0, 11.0, 11.0, 24.0, 43.0, 35.0, 76.0, 113.0, 189.0, 302.0, 581.0, 1062.0, 2305.0, 5574.0, 17349.0, 71619.0, 296072.0, 447114.0, 154209.0, 34965.0, 9753.0, 3705.0, 1606.0, 767.0, 412.0, 224.0, 139.0, 83.0, 55.0, 36.0, 26.0, 29.0, 13.0, 10.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04486083984375, -0.043425559997558594, -0.04199028015136719, -0.04055500030517578, -0.039119720458984375, -0.03768444061279297, -0.03624916076660156, -0.034813880920410156, -0.03337860107421875, -0.031943321228027344, -0.030508041381835938, -0.02907276153564453, -0.027637481689453125, -0.02620220184326172, -0.024766921997070312, -0.023331642150878906, -0.0218963623046875, -0.020461082458496094, -0.019025802612304688, -0.01759052276611328, -0.016155242919921875, -0.014719963073730469, -0.013284683227539062, -0.011849403381347656, -0.01041412353515625, -0.008978843688964844, -0.0075435638427734375, -0.006108283996582031, -0.004673004150390625, -0.0032377243041992188, -0.0018024444580078125, -0.00036716461181640625, 0.001068115234375, 0.0025033950805664062, 0.0039386749267578125, 0.005373954772949219, 0.006809234619140625, 0.008244514465332031, 0.009679794311523438, 0.011115074157714844, 0.01255035400390625, 0.013985633850097656, 0.015420913696289062, 0.01685619354248047, 0.018291473388671875, 0.01972675323486328, 0.021162033081054688, 0.022597312927246094, 0.0240325927734375, 0.025467872619628906, 0.026903152465820312, 0.02833843231201172, 0.029773712158203125, 0.03120899200439453, 0.03264427185058594, 0.034079551696777344, 0.03551483154296875, 0.036950111389160156, 0.03838539123535156, 0.03982067108154297, 0.041255950927734375, 0.04269123077392578, 0.04412651062011719, 0.045561790466308594, 0.0469970703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 10.0, 4.0, 10.0, 14.0, 13.0, 22.0, 28.0, 35.0, 58.0, 60.0, 84.0, 79.0, 84.0, 76.0, 77.0, 80.0, 60.0, 53.0, 41.0, 26.0, 16.0, 18.0, 17.0, 8.0, 3.0, 6.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01544952392578125, -0.015019059181213379, -0.014588594436645508, -0.014158129692077637, -0.013727664947509766, -0.013297200202941895, -0.012866735458374023, -0.012436270713806152, -0.012005805969238281, -0.01157534122467041, -0.011144876480102539, -0.010714411735534668, -0.010283946990966797, -0.009853482246398926, -0.009423017501831055, -0.008992552757263184, -0.008562088012695312, -0.008131623268127441, -0.00770115852355957, -0.007270693778991699, -0.006840229034423828, -0.006409764289855957, -0.005979299545288086, -0.005548834800720215, -0.005118370056152344, -0.004687905311584473, -0.0042574405670166016, -0.0038269758224487305, -0.0033965110778808594, -0.0029660463333129883, -0.002535581588745117, -0.002105116844177246, -0.001674652099609375, -0.001244187355041504, -0.0008137226104736328, -0.0003832578659057617, 4.7206878662109375e-05, 0.00047767162322998047, 0.0009081363677978516, 0.0013386011123657227, 0.0017690658569335938, 0.002199530601501465, 0.002629995346069336, 0.003060460090637207, 0.003490924835205078, 0.003921389579772949, 0.00435185432434082, 0.004782319068908691, 0.0052127838134765625, 0.005643248558044434, 0.006073713302612305, 0.006504178047180176, 0.006934642791748047, 0.007365107536315918, 0.007795572280883789, 0.00822603702545166, 0.008656501770019531, 0.009086966514587402, 0.009517431259155273, 0.009947896003723145, 0.010378360748291016, 0.010808825492858887, 0.011239290237426758, 0.011669754981994629, 0.0121002197265625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 56.0, 556.0, 378.0, 25.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.198397636413574, -8.048991203308105, -7.899584770202637, -7.750178337097168, -7.600771903991699, -7.4513654708862305, -7.301959037780762, -7.152552604675293, -7.003146171569824, -6.8537397384643555, -6.704333305358887, -6.554926872253418, -6.405520439147949, -6.2561140060424805, -6.106707572937012, -5.957301139831543, -5.807894706726074, -5.6584882736206055, -5.509081840515137, -5.359675407409668, -5.210268974304199, -5.0608625411987305, -4.911456108093262, -4.762049674987793, -4.612643718719482, -4.463237285614014, -4.313830852508545, -4.164424419403076, -4.015017986297607, -3.8656115531921387, -3.71620512008667, -3.566798686981201, -3.4173922538757324, -3.2679858207702637, -3.118579387664795, -2.969172954559326, -2.8197665214538574, -2.6703600883483887, -2.52095365524292, -2.371547222137451, -2.2221407890319824, -2.0727343559265137, -1.923327922821045, -1.7739214897155762, -1.6245150566101074, -1.4751086235046387, -1.3257023096084595, -1.1762958765029907, -1.0268895626068115, -0.8774831295013428, -0.728076696395874, -0.57867032289505, -0.4292638897895813, -0.27985745668411255, -0.13045108318328857, 0.018955349922180176, 0.16836178302764893, 0.3177682161331177, 0.46717461943626404, 0.6165810227394104, 0.7659874558448792, 0.9153938889503479, 1.0648002624511719, 1.2142066955566406, 1.3636131286621094]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 3.0, 10.0, 8.0, 8.0, 19.0, 18.0, 29.0, 20.0, 33.0, 34.0, 45.0, 44.0, 47.0, 61.0, 61.0, 54.0, 49.0, 61.0, 50.0, 49.0, 43.0, 50.0, 39.0, 29.0, 23.0, 25.0, 17.0, 14.0, 13.0, 9.0, 3.0, 7.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4294917583465576, -0.4152313470840454, -0.4009709656238556, -0.38671058416366577, -0.37245017290115356, -0.35818976163864136, -0.34392938017845154, -0.3296689987182617, -0.3154085874557495, -0.3011481761932373, -0.2868877947330475, -0.27262741327285767, -0.25836700201034546, -0.24410660564899445, -0.22984620928764343, -0.21558581292629242, -0.2013254165649414, -0.1870650202035904, -0.17280462384223938, -0.15854422748088837, -0.14428383111953735, -0.13002343475818634, -0.11576303839683533, -0.10150264203548431, -0.0872422456741333, -0.07298184931278229, -0.058721452951431274, -0.04446105659008026, -0.030200660228729248, -0.015940263867378235, -0.0016798675060272217, 0.012580528855323792, 0.026840955018997192, 0.041101351380348206, 0.05536174774169922, 0.06962214410305023, 0.08388254046440125, 0.09814293682575226, 0.11240333318710327, 0.12666372954845428, 0.1409241259098053, 0.1551845222711563, 0.16944491863250732, 0.18370531499385834, 0.19796571135520935, 0.21222610771656036, 0.22648650407791138, 0.2407469004392624, 0.2550072968006134, 0.2692676782608032, 0.28352808952331543, 0.29778850078582764, 0.31204888224601746, 0.3263092637062073, 0.3405696749687195, 0.3548300862312317, 0.3690904676914215, 0.38335084915161133, 0.39761126041412354, 0.41187167167663574, 0.42613205313682556, 0.4403924345970154, 0.4546528458595276, 0.4689132571220398, 0.4831736385822296]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 4.0, 10.0, 16.0, 17.0, 36.0, 67.0, 93.0, 161.0, 306.0, 693.0, 1616.0, 4225.0, 14127.0, 86981.0, 700633.0, 205871.0, 23509.0, 6178.0, 2228.0, 892.0, 399.0, 210.0, 92.0, 64.0, 35.0, 24.0, 18.0, 16.0, 7.0, 5.0, 9.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.861328125, -0.8357467651367188, -0.8101654052734375, -0.7845840454101562, -0.759002685546875, -0.7334213256835938, -0.7078399658203125, -0.6822586059570312, -0.65667724609375, -0.6310958862304688, -0.6055145263671875, -0.5799331665039062, -0.554351806640625, -0.5287704467773438, -0.5031890869140625, -0.47760772705078125, -0.4520263671875, -0.42644500732421875, -0.4008636474609375, -0.37528228759765625, -0.349700927734375, -0.32411956787109375, -0.2985382080078125, -0.27295684814453125, -0.24737548828125, -0.22179412841796875, -0.1962127685546875, -0.17063140869140625, -0.145050048828125, -0.11946868896484375, -0.0938873291015625, -0.06830596923828125, -0.042724609375, -0.01714324951171875, 0.0084381103515625, 0.03401947021484375, 0.059600830078125, 0.08518218994140625, 0.1107635498046875, 0.13634490966796875, 0.16192626953125, 0.18750762939453125, 0.2130889892578125, 0.23867034912109375, 0.264251708984375, 0.28983306884765625, 0.3154144287109375, 0.34099578857421875, 0.3665771484375, 0.39215850830078125, 0.4177398681640625, 0.44332122802734375, 0.468902587890625, 0.49448394775390625, 0.5200653076171875, 0.5456466674804688, 0.57122802734375, 0.5968093872070312, 0.6223907470703125, 0.6479721069335938, 0.673553466796875, 0.6991348266601562, 0.7247161865234375, 0.7502975463867188, 0.77587890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 15.0, 13.0, 20.0, 36.0, 32.0, 59.0, 70.0, 79.0, 84.0, 88.0, 96.0, 81.0, 72.0, 74.0, 46.0, 36.0, 25.0, 18.0, 13.0, 9.0, 6.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78369140625, -0.7421798706054688, -0.7006683349609375, -0.6591567993164062, -0.617645263671875, -0.5761337280273438, -0.5346221923828125, -0.49311065673828125, -0.45159912109375, -0.41008758544921875, -0.3685760498046875, -0.32706451416015625, -0.285552978515625, -0.24404144287109375, -0.2025299072265625, -0.16101837158203125, -0.1195068359375, -0.07799530029296875, -0.0364837646484375, 0.00502777099609375, 0.046539306640625, 0.08805084228515625, 0.1295623779296875, 0.17107391357421875, 0.21258544921875, 0.25409698486328125, 0.2956085205078125, 0.33712005615234375, 0.378631591796875, 0.42014312744140625, 0.4616546630859375, 0.5031661987304688, 0.544677734375, 0.5861892700195312, 0.6277008056640625, 0.6692123413085938, 0.710723876953125, 0.7522354125976562, 0.7937469482421875, 0.8352584838867188, 0.87677001953125, 0.9182815551757812, 0.9597930908203125, 1.0013046264648438, 1.042816162109375, 1.0843276977539062, 1.1258392333984375, 1.1673507690429688, 1.2088623046875, 1.2503738403320312, 1.2918853759765625, 1.3333969116210938, 1.374908447265625, 1.4164199829101562, 1.4579315185546875, 1.4994430541992188, 1.54095458984375, 1.5824661254882812, 1.6239776611328125, 1.6654891967773438, 1.707000732421875, 1.7485122680664062, 1.7900238037109375, 1.8315353393554688, 1.873046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 1.0, 8.0, 5.0, 14.0, 10.0, 23.0, 31.0, 52.0, 78.0, 162.0, 263.0, 486.0, 1058.0, 4007.0, 30004.0, 839672.0, 159977.0, 9153.0, 1969.0, 710.0, 322.0, 198.0, 110.0, 61.0, 48.0, 38.0, 16.0, 19.0, 14.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1107635498046875, -1.072113037109375, -1.0334625244140625, -0.99481201171875, -0.9561614990234375, -0.917510986328125, -0.8788604736328125, -0.8402099609375, -0.8015594482421875, -0.762908935546875, -0.7242584228515625, -0.68560791015625, -0.6469573974609375, -0.608306884765625, -0.5696563720703125, -0.531005859375, -0.4923553466796875, -0.453704833984375, -0.4150543212890625, -0.37640380859375, -0.3377532958984375, -0.299102783203125, -0.2604522705078125, -0.2218017578125, -0.1831512451171875, -0.144500732421875, -0.1058502197265625, -0.06719970703125, -0.0285491943359375, 0.010101318359375, 0.0487518310546875, 0.08740234375, 0.1260528564453125, 0.164703369140625, 0.2033538818359375, 0.24200439453125, 0.2806549072265625, 0.319305419921875, 0.3579559326171875, 0.3966064453125, 0.4352569580078125, 0.473907470703125, 0.5125579833984375, 0.55120849609375, 0.5898590087890625, 0.628509521484375, 0.6671600341796875, 0.705810546875, 0.7444610595703125, 0.783111572265625, 0.8217620849609375, 0.86041259765625, 0.8990631103515625, 0.937713623046875, 0.9763641357421875, 1.0150146484375, 1.0536651611328125, 1.092315673828125, 1.1309661865234375, 1.16961669921875, 1.2082672119140625, 1.246917724609375, 1.2855682373046875, 1.32421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 7.0, 13.0, 11.0, 11.0, 11.0, 13.0, 19.0, 25.0, 13.0, 26.0, 32.0, 31.0, 40.0, 43.0, 46.0, 48.0, 47.0, 41.0, 49.0, 42.0, 43.0, 43.0, 37.0, 47.0, 30.0, 46.0, 26.0, 21.0, 26.0, 14.0, 17.0, 13.0, 11.0, 23.0, 3.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.796875, -0.7696533203125, -0.742431640625, -0.7152099609375, -0.68798828125, -0.6607666015625, -0.633544921875, -0.6063232421875, -0.5791015625, -0.5518798828125, -0.524658203125, -0.4974365234375, -0.47021484375, -0.4429931640625, -0.415771484375, -0.3885498046875, -0.361328125, -0.3341064453125, -0.306884765625, -0.2796630859375, -0.25244140625, -0.2252197265625, -0.197998046875, -0.1707763671875, -0.1435546875, -0.1163330078125, -0.089111328125, -0.0618896484375, -0.03466796875, -0.0074462890625, 0.019775390625, 0.0469970703125, 0.07421875, 0.1014404296875, 0.128662109375, 0.1558837890625, 0.18310546875, 0.2103271484375, 0.237548828125, 0.2647705078125, 0.2919921875, 0.3192138671875, 0.346435546875, 0.3736572265625, 0.40087890625, 0.4281005859375, 0.455322265625, 0.4825439453125, 0.509765625, 0.5369873046875, 0.564208984375, 0.5914306640625, 0.61865234375, 0.6458740234375, 0.673095703125, 0.7003173828125, 0.7275390625, 0.7547607421875, 0.781982421875, 0.8092041015625, 0.83642578125, 0.8636474609375, 0.890869140625, 0.9180908203125, 0.9453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 10.0, 22.0, 19.0, 68.0, 100.0, 255.0, 785.0, 2964.0, 23569.0, 943674.0, 70468.0, 4832.0, 1123.0, 339.0, 140.0, 60.0, 40.0, 16.0, 10.0, 11.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.515625, -0.4998321533203125, -0.484039306640625, -0.4682464599609375, -0.45245361328125, -0.4366607666015625, -0.420867919921875, -0.4050750732421875, -0.3892822265625, -0.3734893798828125, -0.357696533203125, -0.3419036865234375, -0.32611083984375, -0.3103179931640625, -0.294525146484375, -0.2787322998046875, -0.262939453125, -0.2471466064453125, -0.231353759765625, -0.2155609130859375, -0.19976806640625, -0.1839752197265625, -0.168182373046875, -0.1523895263671875, -0.1365966796875, -0.1208038330078125, -0.105010986328125, -0.0892181396484375, -0.07342529296875, -0.0576324462890625, -0.041839599609375, -0.0260467529296875, -0.01025390625, 0.0055389404296875, 0.021331787109375, 0.0371246337890625, 0.05291748046875, 0.0687103271484375, 0.084503173828125, 0.1002960205078125, 0.1160888671875, 0.1318817138671875, 0.147674560546875, 0.1634674072265625, 0.17926025390625, 0.1950531005859375, 0.210845947265625, 0.2266387939453125, 0.242431640625, 0.2582244873046875, 0.274017333984375, 0.2898101806640625, 0.30560302734375, 0.3213958740234375, 0.337188720703125, 0.3529815673828125, 0.3687744140625, 0.3845672607421875, 0.400360107421875, 0.4161529541015625, 0.43194580078125, 0.4477386474609375, 0.463531494140625, 0.4793243408203125, 0.4951171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 14.0, 17.0, 14.0, 41.0, 67.0, 90.0, 139.0, 168.0, 128.0, 97.0, 71.0, 38.0, 25.0, 17.0, 17.0, 10.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.236532211303711e-05, -3.114994615316391e-05, -2.993457019329071e-05, -2.871919423341751e-05, -2.750381827354431e-05, -2.6288442313671112e-05, -2.5073066353797913e-05, -2.3857690393924713e-05, -2.2642314434051514e-05, -2.1426938474178314e-05, -2.0211562514305115e-05, -1.8996186554431915e-05, -1.7780810594558716e-05, -1.6565434634685516e-05, -1.5350058674812317e-05, -1.4134682714939117e-05, -1.2919306755065918e-05, -1.1703930795192719e-05, -1.0488554835319519e-05, -9.27317887544632e-06, -8.05780291557312e-06, -6.842426955699921e-06, -5.627050995826721e-06, -4.411675035953522e-06, -3.1962990760803223e-06, -1.980923116207123e-06, -7.655471563339233e-07, 4.498288035392761e-07, 1.6652047634124756e-06, 2.880580723285675e-06, 4.0959566831588745e-06, 5.311332643032074e-06, 6.5267086029052734e-06, 7.742084562778473e-06, 8.957460522651672e-06, 1.0172836482524872e-05, 1.1388212442398071e-05, 1.260358840227127e-05, 1.381896436214447e-05, 1.503434032201767e-05, 1.624971628189087e-05, 1.746509224176407e-05, 1.8680468201637268e-05, 1.9895844161510468e-05, 2.1111220121383667e-05, 2.2326596081256866e-05, 2.3541972041130066e-05, 2.4757348001003265e-05, 2.5972723960876465e-05, 2.7188099920749664e-05, 2.8403475880622864e-05, 2.9618851840496063e-05, 3.083422780036926e-05, 3.204960376024246e-05, 3.326497972011566e-05, 3.448035567998886e-05, 3.569573163986206e-05, 3.691110759973526e-05, 3.812648355960846e-05, 3.934185951948166e-05, 4.055723547935486e-05, 4.177261143922806e-05, 4.298798739910126e-05, 4.420336335897446e-05, 4.5418739318847656e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 5.0, 12.0, 20.0, 32.0, 50.0, 111.0, 202.0, 550.0, 1877.0, 12146.0, 764591.0, 259361.0, 7357.0, 1432.0, 407.0, 160.0, 72.0, 50.0, 32.0, 20.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5498046875, -0.5335807800292969, -0.5173568725585938, -0.5011329650878906, -0.4849090576171875, -0.4686851501464844, -0.45246124267578125, -0.4362373352050781, -0.420013427734375, -0.4037895202636719, -0.38756561279296875, -0.3713417053222656, -0.3551177978515625, -0.3388938903808594, -0.32266998291015625, -0.3064460754394531, -0.29022216796875, -0.2739982604980469, -0.25777435302734375, -0.24155044555664062, -0.2253265380859375, -0.20910263061523438, -0.19287872314453125, -0.17665481567382812, -0.160430908203125, -0.14420700073242188, -0.12798309326171875, -0.11175918579101562, -0.0955352783203125, -0.07931137084960938, -0.06308746337890625, -0.046863555908203125, -0.0306396484375, -0.014415740966796875, 0.00180816650390625, 0.018032073974609375, 0.0342559814453125, 0.050479888916015625, 0.06670379638671875, 0.08292770385742188, 0.099151611328125, 0.11537551879882812, 0.13159942626953125, 0.14782333374023438, 0.1640472412109375, 0.18027114868164062, 0.19649505615234375, 0.21271896362304688, 0.22894287109375, 0.24516677856445312, 0.26139068603515625, 0.2776145935058594, 0.2938385009765625, 0.3100624084472656, 0.32628631591796875, 0.3425102233886719, 0.358734130859375, 0.3749580383300781, 0.39118194580078125, 0.4074058532714844, 0.4236297607421875, 0.4398536682128906, 0.45607757568359375, 0.4723014831542969, 0.488525390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 4.0, 10.0, 13.0, 14.0, 22.0, 27.0, 43.0, 46.0, 71.0, 97.0, 131.0, 117.0, 103.0, 78.0, 58.0, 37.0, 32.0, 16.0, 17.0, 8.0, 9.0, 7.0, 9.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.08021831512451172, -0.07724571228027344, -0.07427310943603516, -0.07130050659179688, -0.0683279037475586, -0.06535530090332031, -0.06238269805908203, -0.05941009521484375, -0.05643749237060547, -0.05346488952636719, -0.050492286682128906, -0.047519683837890625, -0.044547080993652344, -0.04157447814941406, -0.03860187530517578, -0.0356292724609375, -0.03265666961669922, -0.029684066772460938, -0.026711463928222656, -0.023738861083984375, -0.020766258239746094, -0.017793655395507812, -0.014821052551269531, -0.01184844970703125, -0.008875846862792969, -0.0059032440185546875, -0.0029306411743164062, 4.1961669921875e-05, 0.0030145645141601562, 0.0059871673583984375, 0.008959770202636719, 0.011932373046875, 0.014904975891113281, 0.017877578735351562, 0.020850181579589844, 0.023822784423828125, 0.026795387268066406, 0.029767990112304688, 0.03274059295654297, 0.03571319580078125, 0.03868579864501953, 0.04165840148925781, 0.044631004333496094, 0.047603607177734375, 0.050576210021972656, 0.05354881286621094, 0.05652141571044922, 0.0594940185546875, 0.06246662139892578, 0.06543922424316406, 0.06841182708740234, 0.07138442993164062, 0.0743570327758789, 0.07732963562011719, 0.08030223846435547, 0.08327484130859375, 0.08624744415283203, 0.08922004699707031, 0.0921926498413086, 0.09516525268554688, 0.09813785552978516, 0.10111045837402344, 0.10408306121826172, 0.1070556640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 17.0, 44.0, 110.0, 274.0, 291.0, 169.0, 57.0, 32.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.430222511291504, -4.327600002288818, -4.224977493286133, -4.122354984283447, -4.019732475280762, -3.917109966278076, -3.8144874572753906, -3.711864948272705, -3.6092424392700195, -3.506619930267334, -3.4039974212646484, -3.301374912261963, -3.1987524032592773, -3.096129894256592, -2.9935073852539062, -2.8908848762512207, -2.788262367248535, -2.6856398582458496, -2.583017349243164, -2.4803948402404785, -2.377772331237793, -2.2751498222351074, -2.172527313232422, -2.0699048042297363, -1.9672820568084717, -1.8646595478057861, -1.7620370388031006, -1.659414529800415, -1.5567920207977295, -1.454169511795044, -1.3515470027923584, -1.2489244937896729, -1.1463019847869873, -1.0436794757843018, -0.9410569667816162, -0.8384344577789307, -0.7358119487762451, -0.6331893801689148, -0.5305668711662292, -0.4279443621635437, -0.32532185316085815, -0.2226993441581726, -0.12007682025432587, -0.017454296350479126, 0.08516821265220642, 0.18779075145721436, 0.2904132604598999, 0.39303576946258545, 0.495658278465271, 0.5982807874679565, 0.7009032964706421, 0.8035258054733276, 0.9061483144760132, 1.0087709426879883, 1.1113934516906738, 1.2140159606933594, 1.316638469696045, 1.4192609786987305, 1.521883487701416, 1.6245059967041016, 1.727128505706787, 1.8297510147094727, 1.9323735237121582, 2.0349960327148438, 2.1376185417175293]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 9.0, 7.0, 14.0, 9.0, 13.0, 12.0, 18.0, 18.0, 21.0, 34.0, 30.0, 42.0, 41.0, 43.0, 53.0, 46.0, 41.0, 45.0, 40.0, 44.0, 54.0, 38.0, 47.0, 32.0, 41.0, 30.0, 27.0, 19.0, 18.0, 25.0, 12.0, 15.0, 17.0, 8.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7526599168777466, -1.7049481868743896, -1.6572365760803223, -1.6095249652862549, -1.561813235282898, -1.514101505279541, -1.4663898944854736, -1.4186782836914062, -1.3709665536880493, -1.3232548236846924, -1.275543212890625, -1.2278316020965576, -1.1801198720932007, -1.1324081420898438, -1.0846965312957764, -1.036984920501709, -0.989273190498352, -0.9415615200996399, -0.8938498497009277, -0.8461381793022156, -0.7984265089035034, -0.7507148385047913, -0.7030031681060791, -0.6552914977073669, -0.6075798273086548, -0.5598681569099426, -0.5121564865112305, -0.4644448161125183, -0.41673314571380615, -0.369021475315094, -0.32130980491638184, -0.2735981345176697, -0.22588646411895752, -0.17817479372024536, -0.1304631233215332, -0.08275145292282104, -0.03503978252410889, 0.012671887874603271, 0.06038355827331543, 0.10809522867202759, 0.15580689907073975, 0.2035185694694519, 0.25123023986816406, 0.2989419102668762, 0.3466535806655884, 0.39436525106430054, 0.4420769214630127, 0.48978859186172485, 0.537500262260437, 0.5852119326591492, 0.6329236030578613, 0.6806352734565735, 0.7283469438552856, 0.7760586142539978, 0.82377028465271, 0.8714819550514221, 0.9191936254501343, 0.9669052958488464, 1.0146169662475586, 1.062328577041626, 1.110040307044983, 1.1577520370483398, 1.2054636478424072, 1.2531752586364746, 1.3008869886398315]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 37.0, 50.0, 93.0, 183.0, 298.0, 594.0, 1428.0, 4946.0, 43075.0, 2128690.0, 1965655.0, 41991.0, 4565.0, 1374.0, 587.0, 284.0, 160.0, 89.0, 45.0, 30.0, 24.0, 11.0, 8.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.25390625, -1.2106475830078125, -1.167388916015625, -1.1241302490234375, -1.08087158203125, -1.0376129150390625, -0.994354248046875, -0.9510955810546875, -0.9078369140625, -0.8645782470703125, -0.821319580078125, -0.7780609130859375, -0.73480224609375, -0.6915435791015625, -0.648284912109375, -0.6050262451171875, -0.561767578125, -0.5185089111328125, -0.475250244140625, -0.4319915771484375, -0.38873291015625, -0.3454742431640625, -0.302215576171875, -0.2589569091796875, -0.2156982421875, -0.1724395751953125, -0.129180908203125, -0.0859222412109375, -0.04266357421875, 0.0005950927734375, 0.043853759765625, 0.0871124267578125, 0.13037109375, 0.1736297607421875, 0.216888427734375, 0.2601470947265625, 0.30340576171875, 0.3466644287109375, 0.389923095703125, 0.4331817626953125, 0.4764404296875, 0.5196990966796875, 0.562957763671875, 0.6062164306640625, 0.64947509765625, 0.6927337646484375, 0.735992431640625, 0.7792510986328125, 0.822509765625, 0.8657684326171875, 0.909027099609375, 0.9522857666015625, 0.99554443359375, 1.0388031005859375, 1.082061767578125, 1.1253204345703125, 1.1685791015625, 1.2118377685546875, 1.255096435546875, 1.2983551025390625, 1.34161376953125, 1.3848724365234375, 1.428131103515625, 1.4713897705078125, 1.5146484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 5.0, 14.0, 19.0, 9.0, 11.0, 20.0, 25.0, 25.0, 36.0, 38.0, 44.0, 56.0, 50.0, 60.0, 55.0, 71.0, 56.0, 57.0, 48.0, 43.0, 34.0, 46.0, 30.0, 29.0, 23.0, 17.0, 16.0, 8.0, 9.0, 12.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5176239013671875, -0.501068115234375, -0.4845123291015625, -0.46795654296875, -0.4514007568359375, -0.434844970703125, -0.4182891845703125, -0.4017333984375, -0.3851776123046875, -0.368621826171875, -0.3520660400390625, -0.33551025390625, -0.3189544677734375, -0.302398681640625, -0.2858428955078125, -0.269287109375, -0.2527313232421875, -0.236175537109375, -0.2196197509765625, -0.20306396484375, -0.1865081787109375, -0.169952392578125, -0.1533966064453125, -0.1368408203125, -0.1202850341796875, -0.103729248046875, -0.0871734619140625, -0.07061767578125, -0.0540618896484375, -0.037506103515625, -0.0209503173828125, -0.00439453125, 0.0121612548828125, 0.028717041015625, 0.0452728271484375, 0.06182861328125, 0.0783843994140625, 0.094940185546875, 0.1114959716796875, 0.1280517578125, 0.1446075439453125, 0.161163330078125, 0.1777191162109375, 0.19427490234375, 0.2108306884765625, 0.227386474609375, 0.2439422607421875, 0.260498046875, 0.2770538330078125, 0.293609619140625, 0.3101654052734375, 0.32672119140625, 0.3432769775390625, 0.359832763671875, 0.3763885498046875, 0.3929443359375, 0.4095001220703125, 0.426055908203125, 0.4426116943359375, 0.45916748046875, 0.4757232666015625, 0.492279052734375, 0.5088348388671875, 0.525390625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 11.0, 5.0, 5.0, 8.0, 13.0, 11.0, 17.0, 18.0, 23.0, 42.0, 61.0, 109.0, 124.0, 222.0, 354.0, 593.0, 1047.0, 1981.0, 5218.0, 16489.0, 81871.0, 1030515.0, 2821920.0, 190676.0, 29363.0, 7644.0, 2808.0, 1323.0, 676.0, 372.0, 239.0, 158.0, 109.0, 75.0, 55.0, 38.0, 26.0, 25.0, 12.0, 4.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.68115234375, -0.6606369018554688, -0.6401214599609375, -0.6196060180664062, -0.599090576171875, -0.5785751342773438, -0.5580596923828125, -0.5375442504882812, -0.51702880859375, -0.49651336669921875, -0.4759979248046875, -0.45548248291015625, -0.434967041015625, -0.41445159912109375, -0.3939361572265625, -0.37342071533203125, -0.3529052734375, -0.33238983154296875, -0.3118743896484375, -0.29135894775390625, -0.270843505859375, -0.25032806396484375, -0.2298126220703125, -0.20929718017578125, -0.18878173828125, -0.16826629638671875, -0.1477508544921875, -0.12723541259765625, -0.106719970703125, -0.08620452880859375, -0.0656890869140625, -0.04517364501953125, -0.024658203125, -0.00414276123046875, 0.0163726806640625, 0.03688812255859375, 0.057403564453125, 0.07791900634765625, 0.0984344482421875, 0.11894989013671875, 0.13946533203125, 0.15998077392578125, 0.1804962158203125, 0.20101165771484375, 0.221527099609375, 0.24204254150390625, 0.2625579833984375, 0.28307342529296875, 0.3035888671875, 0.32410430908203125, 0.3446197509765625, 0.36513519287109375, 0.385650634765625, 0.40616607666015625, 0.4266815185546875, 0.44719696044921875, 0.46771240234375, 0.48822784423828125, 0.5087432861328125, 0.5292587280273438, 0.549774169921875, 0.5702896118164062, 0.5908050537109375, 0.6113204956054688, 0.6318359375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 5.0, 8.0, 14.0, 18.0, 19.0, 23.0, 24.0, 62.0, 69.0, 93.0, 140.0, 203.0, 324.0, 472.0, 510.0, 531.0, 446.0, 315.0, 224.0, 159.0, 98.0, 74.0, 64.0, 41.0, 18.0, 33.0, 15.0, 17.0, 9.0, 5.0, 8.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.18543243408203125, -0.1798248291015625, -0.17421722412109375, -0.168609619140625, -0.16300201416015625, -0.1573944091796875, -0.15178680419921875, -0.14617919921875, -0.14057159423828125, -0.1349639892578125, -0.12935638427734375, -0.123748779296875, -0.11814117431640625, -0.1125335693359375, -0.10692596435546875, -0.101318359375, -0.09571075439453125, -0.0901031494140625, -0.08449554443359375, -0.078887939453125, -0.07328033447265625, -0.0676727294921875, -0.06206512451171875, -0.05645751953125, -0.05084991455078125, -0.0452423095703125, -0.03963470458984375, -0.034027099609375, -0.02841949462890625, -0.0228118896484375, -0.01720428466796875, -0.0115966796875, -0.00598907470703125, -0.0003814697265625, 0.00522613525390625, 0.010833740234375, 0.01644134521484375, 0.0220489501953125, 0.02765655517578125, 0.03326416015625, 0.03887176513671875, 0.0444793701171875, 0.05008697509765625, 0.055694580078125, 0.06130218505859375, 0.0669097900390625, 0.07251739501953125, 0.078125, 0.08373260498046875, 0.0893402099609375, 0.09494781494140625, 0.100555419921875, 0.10616302490234375, 0.1117706298828125, 0.11737823486328125, 0.12298583984375, 0.12859344482421875, 0.1342010498046875, 0.13980865478515625, 0.145416259765625, 0.15102386474609375, 0.1566314697265625, 0.16223907470703125, 0.1678466796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 12.0, 27.0, 59.0, 123.0, 233.0, 260.0, 137.0, 93.0, 28.0, 17.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.063856840133667, -3.0026767253875732, -2.9414968490600586, -2.880316734313965, -2.81913685798645, -2.7579567432403564, -2.6967766284942627, -2.635596752166748, -2.5744166374206543, -2.5132365226745605, -2.452056646347046, -2.390876531600952, -2.3296966552734375, -2.2685165405273438, -2.20733642578125, -2.1461565494537354, -2.0849764347076416, -2.023796319961548, -1.9626164436340332, -1.9014363288879395, -1.8402563333511353, -1.779076337814331, -1.7178963422775269, -1.6567163467407227, -1.5955363512039185, -1.5343563556671143, -1.47317636013031, -1.4119962453842163, -1.350816249847412, -1.289636254310608, -1.2284562587738037, -1.16727614402771, -1.1060962677001953, -1.0449162721633911, -0.9837362170219421, -0.9225562214851379, -0.861376166343689, -0.8001961708068848, -0.7390161752700806, -0.6778361201286316, -0.6166560649871826, -0.5554760694503784, -0.49429601430892944, -0.43311601877212524, -0.37193596363067627, -0.31075596809387207, -0.24957594275474548, -0.1883959174156189, -0.12721586227416992, -0.06603583693504333, -0.004855819046497345, 0.056324198842048645, 0.11750422418117523, 0.17868423461914062, 0.2398642599582672, 0.3010442852973938, 0.3622243106365204, 0.423404335975647, 0.48458436131477356, 0.5457643866539001, 0.6069443821907043, 0.6681244373321533, 0.7293044328689575, 0.7904844284057617, 0.8516644835472107]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 6.0, 8.0, 12.0, 12.0, 16.0, 9.0, 25.0, 20.0, 18.0, 27.0, 52.0, 34.0, 47.0, 54.0, 50.0, 70.0, 56.0, 59.0, 46.0, 58.0, 44.0, 43.0, 49.0, 35.0, 24.0, 26.0, 17.0, 16.0, 12.0, 11.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6152368783950806, -0.5964518785476685, -0.5776668787002563, -0.5588818788528442, -0.5400968790054321, -0.5213118195533752, -0.5025268197059631, -0.483741819858551, -0.4649568200111389, -0.4461718201637268, -0.4273868203163147, -0.4086017906665802, -0.3898167908191681, -0.371031790971756, -0.3522467613220215, -0.3334617614746094, -0.31467676162719727, -0.29589176177978516, -0.27710676193237305, -0.25832173228263855, -0.23953673243522644, -0.22075173258781433, -0.20196671783924103, -0.18318170309066772, -0.16439670324325562, -0.1456117033958435, -0.1268266886472702, -0.1080416813492775, -0.08925667405128479, -0.07047166675329208, -0.05168665945529938, -0.032901644706726074, -0.01411658525466919, 0.004668422043323517, 0.023453429341316223, 0.04223843663930893, 0.061023443937301636, 0.07980845123529434, 0.09859345853328705, 0.11737847328186035, 0.13616347312927246, 0.15494847297668457, 0.17373348772525787, 0.19251850247383118, 0.2113035023212433, 0.2300885021686554, 0.2488735169172287, 0.267658531665802, 0.2864435315132141, 0.3052285313606262, 0.32401353120803833, 0.3427985608577728, 0.36158356070518494, 0.38036856055259705, 0.39915359020233154, 0.41793859004974365, 0.43672358989715576, 0.45550858974456787, 0.47429358959198, 0.4930786192417145, 0.5118635892868042, 0.5306486487388611, 0.5494336485862732, 0.5682186484336853, 0.5870036482810974]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 12.0, 26.0, 46.0, 50.0, 80.0, 177.0, 389.0, 1126.0, 4230.0, 20761.0, 124859.0, 510649.0, 318027.0, 54632.0, 9896.0, 2284.0, 665.0, 278.0, 130.0, 79.0, 50.0, 28.0, 17.0, 15.0, 14.0, 10.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.16562843322753906, -0.16072463989257812, -0.1558208465576172, -0.15091705322265625, -0.1460132598876953, -0.14110946655273438, -0.13620567321777344, -0.1313018798828125, -0.12639808654785156, -0.12149429321289062, -0.11659049987792969, -0.11168670654296875, -0.10678291320800781, -0.10187911987304688, -0.09697532653808594, -0.092071533203125, -0.08716773986816406, -0.08226394653320312, -0.07736015319824219, -0.07245635986328125, -0.06755256652832031, -0.06264877319335938, -0.05774497985839844, -0.0528411865234375, -0.04793739318847656, -0.043033599853515625, -0.03812980651855469, -0.03322601318359375, -0.028322219848632812, -0.023418426513671875, -0.018514633178710938, -0.01361083984375, -0.008707046508789062, -0.003803253173828125, 0.0011005401611328125, 0.00600433349609375, 0.010908126831054688, 0.015811920166015625, 0.020715713500976562, 0.0256195068359375, 0.030523300170898438, 0.035427093505859375, 0.04033088684082031, 0.04523468017578125, 0.05013847351074219, 0.055042266845703125, 0.05994606018066406, 0.064849853515625, 0.06975364685058594, 0.07465744018554688, 0.07956123352050781, 0.08446502685546875, 0.08936882019042969, 0.09427261352539062, 0.09917640686035156, 0.1040802001953125, 0.10898399353027344, 0.11388778686523438, 0.11879158020019531, 0.12369537353515625, 0.1285991668701172, 0.13350296020507812, 0.13840675354003906, 0.143310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 11.0, 16.0, 17.0, 23.0, 33.0, 48.0, 46.0, 72.0, 79.0, 87.0, 99.0, 87.0, 58.0, 69.0, 56.0, 49.0, 25.0, 27.0, 17.0, 21.0, 13.0, 12.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.458740234375, -0.4406242370605469, -0.42250823974609375, -0.4043922424316406, -0.3862762451171875, -0.3681602478027344, -0.35004425048828125, -0.3319282531738281, -0.313812255859375, -0.2956962585449219, -0.27758026123046875, -0.2594642639160156, -0.2413482666015625, -0.22323226928710938, -0.20511627197265625, -0.18700027465820312, -0.16888427734375, -0.15076828002929688, -0.13265228271484375, -0.11453628540039062, -0.0964202880859375, -0.07830429077148438, -0.06018829345703125, -0.042072296142578125, -0.023956298828125, -0.005840301513671875, 0.01227569580078125, 0.030391693115234375, 0.0485076904296875, 0.06662368774414062, 0.08473968505859375, 0.10285568237304688, 0.1209716796875, 0.13908767700195312, 0.15720367431640625, 0.17531967163085938, 0.1934356689453125, 0.21155166625976562, 0.22966766357421875, 0.24778366088867188, 0.265899658203125, 0.2840156555175781, 0.30213165283203125, 0.3202476501464844, 0.3383636474609375, 0.3564796447753906, 0.37459564208984375, 0.3927116394042969, 0.41082763671875, 0.4289436340332031, 0.44705963134765625, 0.4651756286621094, 0.4832916259765625, 0.5014076232910156, 0.5195236206054688, 0.5376396179199219, 0.555755615234375, 0.5738716125488281, 0.5919876098632812, 0.6101036071777344, 0.6282196044921875, 0.6463356018066406, 0.6644515991210938, 0.6825675964355469, 0.70068359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 9.0, 13.0, 16.0, 20.0, 28.0, 47.0, 49.0, 87.0, 115.0, 149.0, 264.0, 381.0, 590.0, 1065.0, 1773.0, 3590.0, 6652.0, 13870.0, 29026.0, 62380.0, 128140.0, 221112.0, 247492.0, 167976.0, 84936.0, 40279.0, 18861.0, 9196.0, 4590.0, 2359.0, 1354.0, 763.0, 425.0, 274.0, 180.0, 130.0, 96.0, 76.0, 48.0, 30.0, 28.0, 18.0, 21.0, 5.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06072998046875, -0.05878448486328125, -0.0568389892578125, -0.05489349365234375, -0.052947998046875, -0.05100250244140625, -0.0490570068359375, -0.04711151123046875, -0.045166015625, -0.04322052001953125, -0.0412750244140625, -0.03932952880859375, -0.037384033203125, -0.03543853759765625, -0.0334930419921875, -0.03154754638671875, -0.02960205078125, -0.02765655517578125, -0.0257110595703125, -0.02376556396484375, -0.021820068359375, -0.01987457275390625, -0.0179290771484375, -0.01598358154296875, -0.0140380859375, -0.01209259033203125, -0.0101470947265625, -0.00820159912109375, -0.006256103515625, -0.00431060791015625, -0.0023651123046875, -0.00041961669921875, 0.00152587890625, 0.00347137451171875, 0.0054168701171875, 0.00736236572265625, 0.009307861328125, 0.01125335693359375, 0.0131988525390625, 0.01514434814453125, 0.01708984375, 0.01903533935546875, 0.0209808349609375, 0.02292633056640625, 0.024871826171875, 0.02681732177734375, 0.0287628173828125, 0.03070831298828125, 0.03265380859375, 0.03459930419921875, 0.0365447998046875, 0.03849029541015625, 0.040435791015625, 0.04238128662109375, 0.0443267822265625, 0.04627227783203125, 0.0482177734375, 0.05016326904296875, 0.0521087646484375, 0.05405426025390625, 0.055999755859375, 0.05794525146484375, 0.0598907470703125, 0.06183624267578125, 0.06378173828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 7.0, 4.0, 9.0, 10.0, 18.0, 10.0, 21.0, 11.0, 21.0, 27.0, 24.0, 31.0, 41.0, 47.0, 37.0, 52.0, 52.0, 48.0, 63.0, 44.0, 38.0, 49.0, 35.0, 45.0, 43.0, 23.0, 33.0, 14.0, 25.0, 20.0, 19.0, 8.0, 7.0, 14.0, 6.0, 8.0, 5.0, 2.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.69921875, -0.6778106689453125, -0.656402587890625, -0.6349945068359375, -0.61358642578125, -0.5921783447265625, -0.570770263671875, -0.5493621826171875, -0.5279541015625, -0.5065460205078125, -0.485137939453125, -0.4637298583984375, -0.44232177734375, -0.4209136962890625, -0.399505615234375, -0.3780975341796875, -0.356689453125, -0.3352813720703125, -0.313873291015625, -0.2924652099609375, -0.27105712890625, -0.2496490478515625, -0.228240966796875, -0.2068328857421875, -0.1854248046875, -0.1640167236328125, -0.142608642578125, -0.1212005615234375, -0.09979248046875, -0.0783843994140625, -0.056976318359375, -0.0355682373046875, -0.01416015625, 0.0072479248046875, 0.028656005859375, 0.0500640869140625, 0.07147216796875, 0.0928802490234375, 0.114288330078125, 0.1356964111328125, 0.1571044921875, 0.1785125732421875, 0.199920654296875, 0.2213287353515625, 0.24273681640625, 0.2641448974609375, 0.285552978515625, 0.3069610595703125, 0.328369140625, 0.3497772216796875, 0.371185302734375, 0.3925933837890625, 0.41400146484375, 0.4354095458984375, 0.456817626953125, 0.4782257080078125, 0.4996337890625, 0.5210418701171875, 0.542449951171875, 0.5638580322265625, 0.58526611328125, 0.6066741943359375, 0.628082275390625, 0.6494903564453125, 0.6708984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 9.0, 24.0, 33.0, 56.0, 55.0, 92.0, 122.0, 208.0, 363.0, 650.0, 1044.0, 2137.0, 4728.0, 12165.0, 39406.0, 156823.0, 449738.0, 277935.0, 69672.0, 19766.0, 7049.0, 2997.0, 1528.0, 792.0, 432.0, 235.0, 173.0, 114.0, 67.0, 34.0, 29.0, 17.0, 12.0, 9.0, 4.0, 7.0, 1.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.032379150390625, -0.03135824203491211, -0.03033733367919922, -0.029316425323486328, -0.028295516967773438, -0.027274608612060547, -0.026253700256347656, -0.025232791900634766, -0.024211883544921875, -0.023190975189208984, -0.022170066833496094, -0.021149158477783203, -0.020128250122070312, -0.019107341766357422, -0.01808643341064453, -0.01706552505493164, -0.01604461669921875, -0.01502370834350586, -0.014002799987792969, -0.012981891632080078, -0.011960983276367188, -0.010940074920654297, -0.009919166564941406, -0.008898258209228516, -0.007877349853515625, -0.006856441497802734, -0.005835533142089844, -0.004814624786376953, -0.0037937164306640625, -0.002772808074951172, -0.0017518997192382812, -0.0007309913635253906, 0.0002899169921875, 0.0013108253479003906, 0.0023317337036132812, 0.003352642059326172, 0.0043735504150390625, 0.005394458770751953, 0.006415367126464844, 0.007436275482177734, 0.008457183837890625, 0.009478092193603516, 0.010499000549316406, 0.011519908905029297, 0.012540817260742188, 0.013561725616455078, 0.014582633972167969, 0.01560354232788086, 0.01662445068359375, 0.01764535903930664, 0.01866626739501953, 0.019687175750732422, 0.020708084106445312, 0.021728992462158203, 0.022749900817871094, 0.023770809173583984, 0.024791717529296875, 0.025812625885009766, 0.026833534240722656, 0.027854442596435547, 0.028875350952148438, 0.029896259307861328, 0.03091716766357422, 0.03193807601928711, 0.032958984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 12.0, 16.0, 17.0, 30.0, 40.0, 70.0, 70.0, 85.0, 88.0, 99.0, 97.0, 99.0, 67.0, 62.0, 44.0, 38.0, 22.0, 11.0, 3.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71661376953125e-05, -1.6568228602409363e-05, -1.5970319509506226e-05, -1.537241041660309e-05, -1.4774501323699951e-05, -1.4176592230796814e-05, -1.3578683137893677e-05, -1.298077404499054e-05, -1.2382864952087402e-05, -1.1784955859184265e-05, -1.1187046766281128e-05, -1.058913767337799e-05, -9.991228580474854e-06, -9.393319487571716e-06, -8.795410394668579e-06, -8.197501301765442e-06, -7.599592208862305e-06, -7.0016831159591675e-06, -6.40377402305603e-06, -5.805864930152893e-06, -5.207955837249756e-06, -4.610046744346619e-06, -4.0121376514434814e-06, -3.4142285585403442e-06, -2.816319465637207e-06, -2.21841037273407e-06, -1.6205012798309326e-06, -1.0225921869277954e-06, -4.246830940246582e-07, 1.73225998878479e-07, 7.711350917816162e-07, 1.3690441846847534e-06, 1.9669532775878906e-06, 2.564862370491028e-06, 3.162771463394165e-06, 3.7606805562973022e-06, 4.3585896492004395e-06, 4.956498742103577e-06, 5.554407835006714e-06, 6.152316927909851e-06, 6.750226020812988e-06, 7.3481351137161255e-06, 7.946044206619263e-06, 8.5439532995224e-06, 9.141862392425537e-06, 9.739771485328674e-06, 1.0337680578231812e-05, 1.0935589671134949e-05, 1.1533498764038086e-05, 1.2131407856941223e-05, 1.272931694984436e-05, 1.3327226042747498e-05, 1.3925135135650635e-05, 1.4523044228553772e-05, 1.512095332145691e-05, 1.5718862414360046e-05, 1.6316771507263184e-05, 1.691468060016632e-05, 1.7512589693069458e-05, 1.8110498785972595e-05, 1.8708407878875732e-05, 1.930631697177887e-05, 1.9904226064682007e-05, 2.0502135157585144e-05, 2.110004425048828e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 5.0, 20.0, 18.0, 24.0, 43.0, 61.0, 64.0, 108.0, 189.0, 316.0, 570.0, 1202.0, 2655.0, 7204.0, 22753.0, 79725.0, 257296.0, 393055.0, 198391.0, 58016.0, 16840.0, 5666.0, 2142.0, 945.0, 468.0, 291.0, 154.0, 102.0, 59.0, 43.0, 40.0, 20.0, 12.0, 14.0, 14.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031524658203125, -0.03058004379272461, -0.02963542938232422, -0.028690814971923828, -0.027746200561523438, -0.026801586151123047, -0.025856971740722656, -0.024912357330322266, -0.023967742919921875, -0.023023128509521484, -0.022078514099121094, -0.021133899688720703, -0.020189285278320312, -0.019244670867919922, -0.01830005645751953, -0.01735544204711914, -0.01641082763671875, -0.01546621322631836, -0.014521598815917969, -0.013576984405517578, -0.012632369995117188, -0.011687755584716797, -0.010743141174316406, -0.009798526763916016, -0.008853912353515625, -0.007909297943115234, -0.006964683532714844, -0.006020069122314453, -0.0050754547119140625, -0.004130840301513672, -0.0031862258911132812, -0.0022416114807128906, -0.0012969970703125, -0.0003523826599121094, 0.0005922317504882812, 0.0015368461608886719, 0.0024814605712890625, 0.003426074981689453, 0.004370689392089844, 0.005315303802490234, 0.006259918212890625, 0.007204532623291016, 0.008149147033691406, 0.009093761444091797, 0.010038375854492188, 0.010982990264892578, 0.011927604675292969, 0.01287221908569336, 0.01381683349609375, 0.01476144790649414, 0.01570606231689453, 0.016650676727294922, 0.017595291137695312, 0.018539905548095703, 0.019484519958496094, 0.020429134368896484, 0.021373748779296875, 0.022318363189697266, 0.023262977600097656, 0.024207592010498047, 0.025152206420898438, 0.026096820831298828, 0.02704143524169922, 0.02798604965209961, 0.0289306640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 11.0, 6.0, 12.0, 15.0, 9.0, 20.0, 29.0, 32.0, 40.0, 40.0, 33.0, 59.0, 59.0, 63.0, 52.0, 52.0, 51.0, 45.0, 64.0, 34.0, 39.0, 36.0, 36.0, 31.0, 12.0, 19.0, 18.0, 23.0, 12.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.008056640625, -0.007813096046447754, -0.007569551467895508, -0.007326006889343262, -0.007082462310791016, -0.0068389177322387695, -0.0065953731536865234, -0.006351828575134277, -0.006108283996582031, -0.005864739418029785, -0.005621194839477539, -0.005377650260925293, -0.005134105682373047, -0.004890561103820801, -0.004647016525268555, -0.004403471946716309, -0.0041599273681640625, -0.003916382789611816, -0.0036728382110595703, -0.0034292936325073242, -0.003185749053955078, -0.002942204475402832, -0.002698659896850586, -0.00245511531829834, -0.0022115707397460938, -0.0019680261611938477, -0.0017244815826416016, -0.0014809370040893555, -0.0012373924255371094, -0.0009938478469848633, -0.0007503032684326172, -0.0005067586898803711, -0.000263214111328125, -1.9669532775878906e-05, 0.0002238750457763672, 0.0004674196243286133, 0.0007109642028808594, 0.0009545087814331055, 0.0011980533599853516, 0.0014415979385375977, 0.0016851425170898438, 0.0019286870956420898, 0.002172231674194336, 0.002415776252746582, 0.002659320831298828, 0.0029028654098510742, 0.0031464099884033203, 0.0033899545669555664, 0.0036334991455078125, 0.0038770437240600586, 0.004120588302612305, 0.004364132881164551, 0.004607677459716797, 0.004851222038269043, 0.005094766616821289, 0.005338311195373535, 0.005581855773925781, 0.005825400352478027, 0.0060689449310302734, 0.0063124895095825195, 0.006556034088134766, 0.006799578666687012, 0.007043123245239258, 0.007286667823791504, 0.00753021240234375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 167.0, 753.0, 77.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.984787940979004, -7.8405842781066895, -7.696380615234375, -7.5521769523620605, -7.407973289489746, -7.263769626617432, -7.119565963745117, -6.975362300872803, -6.831158638000488, -6.686954975128174, -6.542751312255859, -6.398547649383545, -6.2543439865112305, -6.110140323638916, -5.965936660766602, -5.821732997894287, -5.677529335021973, -5.533325672149658, -5.389122009277344, -5.244918346405029, -5.100714683532715, -4.9565110206604, -4.812307357788086, -4.6681036949157715, -4.523899555206299, -4.379695892333984, -4.23549222946167, -4.0912885665893555, -3.947084903717041, -3.8028812408447266, -3.658677577972412, -3.5144739151000977, -3.3702704906463623, -3.226066827774048, -3.0818631649017334, -2.937659502029419, -2.7934558391571045, -2.64925217628479, -2.5050482749938965, -2.360844612121582, -2.2166409492492676, -2.072437286376953, -1.9282336235046387, -1.7840299606323242, -1.6398262977600098, -1.4956226348876953, -1.3514188528060913, -1.2072151899337769, -1.063011646270752, -0.9188079833984375, -0.774604320526123, -0.6304005980491638, -0.48619693517684937, -0.3419932723045349, -0.19778954982757568, -0.05358588695526123, 0.09061777591705322, 0.23482145369052887, 0.3790251314640045, 0.5232288241386414, 0.6674324870109558, 0.8116361498832703, 0.9558398723602295, 1.100043535232544, 1.2442471981048584]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 7.0, 13.0, 15.0, 17.0, 17.0, 23.0, 21.0, 37.0, 51.0, 42.0, 75.0, 81.0, 71.0, 79.0, 71.0, 70.0, 54.0, 57.0, 40.0, 38.0, 26.0, 20.0, 16.0, 20.0, 7.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4294459819793701, -0.4136611819267273, -0.3978763818740845, -0.38209158182144165, -0.36630678176879883, -0.350521981716156, -0.3347371518611908, -0.318952351808548, -0.30316755175590515, -0.28738275170326233, -0.2715979516506195, -0.2558131515979767, -0.24002833664417267, -0.22424353659152985, -0.20845872163772583, -0.192673921585083, -0.17688912153244019, -0.16110432147979736, -0.14531952142715454, -0.12953470647335052, -0.1137499064207077, -0.09796510636806488, -0.08218029886484146, -0.06639549136161804, -0.05061069130897522, -0.0348258875310421, -0.01904108375310898, -0.0032562799751758575, 0.012528523802757263, 0.028313323855400085, 0.044098131358623505, 0.059882938861846924, 0.07566767930984497, 0.09145247936248779, 0.10723728686571121, 0.12302209436893463, 0.13880689442157745, 0.15459169447422028, 0.1703765094280243, 0.18616130948066711, 0.20194610953330994, 0.21773090958595276, 0.23351570963859558, 0.2493005245923996, 0.2650853395462036, 0.28087013959884644, 0.29665493965148926, 0.3124397397041321, 0.3282245397567749, 0.3440093398094177, 0.35979413986206055, 0.37557893991470337, 0.3913637399673462, 0.407148540019989, 0.4229333698749542, 0.43871816992759705, 0.45450296998023987, 0.4702877700328827, 0.4860725700855255, 0.5018573999404907, 0.5176421999931335, 0.5334270000457764, 0.5492118000984192, 0.564996600151062, 0.5807814002037048]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 12.0, 15.0, 9.0, 24.0, 30.0, 41.0, 72.0, 105.0, 190.0, 268.0, 428.0, 668.0, 1114.0, 2057.0, 4166.0, 8619.0, 19970.0, 53038.0, 169025.0, 415145.0, 247196.0, 76592.0, 26991.0, 11199.0, 5232.0, 2665.0, 1466.0, 840.0, 505.0, 318.0, 170.0, 97.0, 85.0, 59.0, 26.0, 29.0, 21.0, 13.0, 11.0, 11.0, 3.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335693359375, -0.32572174072265625, -0.3157501220703125, -0.30577850341796875, -0.295806884765625, -0.28583526611328125, -0.2758636474609375, -0.26589202880859375, -0.25592041015625, -0.24594879150390625, -0.2359771728515625, -0.22600555419921875, -0.216033935546875, -0.20606231689453125, -0.1960906982421875, -0.18611907958984375, -0.1761474609375, -0.16617584228515625, -0.1562042236328125, -0.14623260498046875, -0.136260986328125, -0.12628936767578125, -0.1163177490234375, -0.10634613037109375, -0.09637451171875, -0.08640289306640625, -0.0764312744140625, -0.06645965576171875, -0.056488037109375, -0.04651641845703125, -0.0365447998046875, -0.02657318115234375, -0.0166015625, -0.00662994384765625, 0.0033416748046875, 0.01331329345703125, 0.023284912109375, 0.03325653076171875, 0.0432281494140625, 0.05319976806640625, 0.06317138671875, 0.07314300537109375, 0.0831146240234375, 0.09308624267578125, 0.103057861328125, 0.11302947998046875, 0.1230010986328125, 0.13297271728515625, 0.1429443359375, 0.15291595458984375, 0.1628875732421875, 0.17285919189453125, 0.182830810546875, 0.19280242919921875, 0.2027740478515625, 0.21274566650390625, 0.22271728515625, 0.23268890380859375, 0.2426605224609375, 0.25263214111328125, 0.262603759765625, 0.27257537841796875, 0.2825469970703125, 0.29251861572265625, 0.302490234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 8.0, 3.0, 14.0, 13.0, 13.0, 15.0, 21.0, 17.0, 22.0, 27.0, 33.0, 43.0, 49.0, 40.0, 57.0, 65.0, 55.0, 55.0, 66.0, 45.0, 55.0, 41.0, 25.0, 37.0, 32.0, 24.0, 22.0, 15.0, 17.0, 16.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8349456787109375, -0.811492919921875, -0.7880401611328125, -0.76458740234375, -0.7411346435546875, -0.717681884765625, -0.6942291259765625, -0.6707763671875, -0.6473236083984375, -0.623870849609375, -0.6004180908203125, -0.57696533203125, -0.5535125732421875, -0.530059814453125, -0.5066070556640625, -0.483154296875, -0.4597015380859375, -0.436248779296875, -0.4127960205078125, -0.38934326171875, -0.3658905029296875, -0.342437744140625, -0.3189849853515625, -0.2955322265625, -0.2720794677734375, -0.248626708984375, -0.2251739501953125, -0.20172119140625, -0.1782684326171875, -0.154815673828125, -0.1313629150390625, -0.10791015625, -0.0844573974609375, -0.061004638671875, -0.0375518798828125, -0.01409912109375, 0.0093536376953125, 0.032806396484375, 0.0562591552734375, 0.0797119140625, 0.1031646728515625, 0.126617431640625, 0.1500701904296875, 0.17352294921875, 0.1969757080078125, 0.220428466796875, 0.2438812255859375, 0.267333984375, 0.2907867431640625, 0.314239501953125, 0.3376922607421875, 0.36114501953125, 0.3845977783203125, 0.408050537109375, 0.4315032958984375, 0.4549560546875, 0.4784088134765625, 0.501861572265625, 0.5253143310546875, 0.54876708984375, 0.5722198486328125, 0.595672607421875, 0.6191253662109375, 0.642578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 4.0, 13.0, 14.0, 18.0, 16.0, 39.0, 63.0, 123.0, 197.0, 494.0, 2044.0, 39623.0, 952473.0, 50160.0, 2231.0, 540.0, 209.0, 92.0, 57.0, 40.0, 32.0, 19.0, 16.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.042724609375, -1.00341796875, -0.964111328125, -0.9248046875, -0.885498046875, -0.84619140625, -0.806884765625, -0.767578125, -0.728271484375, -0.68896484375, -0.649658203125, -0.6103515625, -0.571044921875, -0.53173828125, -0.492431640625, -0.453125, -0.413818359375, -0.37451171875, -0.335205078125, -0.2958984375, -0.256591796875, -0.21728515625, -0.177978515625, -0.138671875, -0.099365234375, -0.06005859375, -0.020751953125, 0.0185546875, 0.057861328125, 0.09716796875, 0.136474609375, 0.17578125, 0.215087890625, 0.25439453125, 0.293701171875, 0.3330078125, 0.372314453125, 0.41162109375, 0.450927734375, 0.490234375, 0.529541015625, 0.56884765625, 0.608154296875, 0.6474609375, 0.686767578125, 0.72607421875, 0.765380859375, 0.8046875, 0.843994140625, 0.88330078125, 0.922607421875, 0.9619140625, 1.001220703125, 1.04052734375, 1.079833984375, 1.119140625, 1.158447265625, 1.19775390625, 1.237060546875, 1.2763671875, 1.315673828125, 1.35498046875, 1.394287109375, 1.43359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 1.0, 2.0, 6.0, 7.0, 11.0, 11.0, 17.0, 16.0, 19.0, 27.0, 25.0, 22.0, 27.0, 35.0, 44.0, 42.0, 24.0, 42.0, 57.0, 36.0, 46.0, 47.0, 49.0, 48.0, 37.0, 36.0, 35.0, 28.0, 31.0, 33.0, 19.0, 25.0, 17.0, 11.0, 15.0, 14.0, 10.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.81640625, -0.7922134399414062, -0.7680206298828125, -0.7438278198242188, -0.719635009765625, -0.6954421997070312, -0.6712493896484375, -0.6470565795898438, -0.62286376953125, -0.5986709594726562, -0.5744781494140625, -0.5502853393554688, -0.526092529296875, -0.5018997192382812, -0.4777069091796875, -0.45351409912109375, -0.4293212890625, -0.40512847900390625, -0.3809356689453125, -0.35674285888671875, -0.332550048828125, -0.30835723876953125, -0.2841644287109375, -0.25997161865234375, -0.23577880859375, -0.21158599853515625, -0.1873931884765625, -0.16320037841796875, -0.139007568359375, -0.11481475830078125, -0.0906219482421875, -0.06642913818359375, -0.042236328125, -0.01804351806640625, 0.0061492919921875, 0.03034210205078125, 0.054534912109375, 0.07872772216796875, 0.1029205322265625, 0.12711334228515625, 0.15130615234375, 0.17549896240234375, 0.1996917724609375, 0.22388458251953125, 0.248077392578125, 0.27227020263671875, 0.2964630126953125, 0.32065582275390625, 0.3448486328125, 0.36904144287109375, 0.3932342529296875, 0.41742706298828125, 0.441619873046875, 0.46581268310546875, 0.4900054931640625, 0.5141983032226562, 0.53839111328125, 0.5625839233398438, 0.5867767333984375, 0.6109695434570312, 0.635162353515625, 0.6593551635742188, 0.6835479736328125, 0.7077407836914062, 0.73193359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 7.0, 9.0, 19.0, 34.0, 84.0, 158.0, 458.0, 1627.0, 10430.0, 895634.0, 134281.0, 4337.0, 892.0, 317.0, 117.0, 54.0, 29.0, 14.0, 9.0, 5.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.494384765625, -0.4766044616699219, -0.45882415771484375, -0.4410438537597656, -0.4232635498046875, -0.4054832458496094, -0.38770294189453125, -0.3699226379394531, -0.352142333984375, -0.3343620300292969, -0.31658172607421875, -0.2988014221191406, -0.2810211181640625, -0.2632408142089844, -0.24546051025390625, -0.22768020629882812, -0.20989990234375, -0.19211959838867188, -0.17433929443359375, -0.15655899047851562, -0.1387786865234375, -0.12099838256835938, -0.10321807861328125, -0.08543777465820312, -0.067657470703125, -0.049877166748046875, -0.03209686279296875, -0.014316558837890625, 0.0034637451171875, 0.021244049072265625, 0.03902435302734375, 0.056804656982421875, 0.0745849609375, 0.09236526489257812, 0.11014556884765625, 0.12792587280273438, 0.1457061767578125, 0.16348648071289062, 0.18126678466796875, 0.19904708862304688, 0.216827392578125, 0.23460769653320312, 0.25238800048828125, 0.2701683044433594, 0.2879486083984375, 0.3057289123535156, 0.32350921630859375, 0.3412895202636719, 0.35906982421875, 0.3768501281738281, 0.39463043212890625, 0.4124107360839844, 0.4301910400390625, 0.4479713439941406, 0.46575164794921875, 0.4835319519042969, 0.501312255859375, 0.5190925598144531, 0.5368728637695312, 0.5546531677246094, 0.5724334716796875, 0.5902137756347656, 0.6079940795898438, 0.6257743835449219, 0.6435546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 10.0, 10.0, 25.0, 33.0, 58.0, 95.0, 153.0, 182.0, 167.0, 100.0, 63.0, 30.0, 18.0, 19.0, 9.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.863739013671875e-05, -4.7147274017333984e-05, -4.565715789794922e-05, -4.416704177856445e-05, -4.267692565917969e-05, -4.118680953979492e-05, -3.9696693420410156e-05, -3.820657730102539e-05, -3.6716461181640625e-05, -3.522634506225586e-05, -3.3736228942871094e-05, -3.224611282348633e-05, -3.075599670410156e-05, -2.9265880584716797e-05, -2.777576446533203e-05, -2.6285648345947266e-05, -2.47955322265625e-05, -2.3305416107177734e-05, -2.181529998779297e-05, -2.0325183868408203e-05, -1.8835067749023438e-05, -1.7344951629638672e-05, -1.5854835510253906e-05, -1.436471939086914e-05, -1.2874603271484375e-05, -1.138448715209961e-05, -9.894371032714844e-06, -8.404254913330078e-06, -6.9141387939453125e-06, -5.424022674560547e-06, -3.933906555175781e-06, -2.4437904357910156e-06, -9.5367431640625e-07, 5.364418029785156e-07, 2.0265579223632812e-06, 3.516674041748047e-06, 5.0067901611328125e-06, 6.496906280517578e-06, 7.987022399902344e-06, 9.47713851928711e-06, 1.0967254638671875e-05, 1.245737075805664e-05, 1.3947486877441406e-05, 1.5437602996826172e-05, 1.6927719116210938e-05, 1.8417835235595703e-05, 1.990795135498047e-05, 2.1398067474365234e-05, 2.288818359375e-05, 2.4378299713134766e-05, 2.586841583251953e-05, 2.7358531951904297e-05, 2.8848648071289062e-05, 3.0338764190673828e-05, 3.1828880310058594e-05, 3.331899642944336e-05, 3.4809112548828125e-05, 3.629922866821289e-05, 3.7789344787597656e-05, 3.927946090698242e-05, 4.076957702636719e-05, 4.225969314575195e-05, 4.374980926513672e-05, 4.5239925384521484e-05, 4.673004150390625e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 10.0, 4.0, 11.0, 17.0, 22.0, 35.0, 69.0, 109.0, 218.0, 532.0, 1424.0, 6051.0, 95980.0, 909639.0, 28870.0, 3649.0, 1049.0, 409.0, 182.0, 93.0, 55.0, 30.0, 27.0, 17.0, 9.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.4329032897949219, -0.41951751708984375, -0.4061317443847656, -0.3927459716796875, -0.3793601989746094, -0.36597442626953125, -0.3525886535644531, -0.339202880859375, -0.3258171081542969, -0.31243133544921875, -0.2990455627441406, -0.2856597900390625, -0.2722740173339844, -0.25888824462890625, -0.24550247192382812, -0.23211669921875, -0.21873092651367188, -0.20534515380859375, -0.19195938110351562, -0.1785736083984375, -0.16518783569335938, -0.15180206298828125, -0.13841629028320312, -0.125030517578125, -0.11164474487304688, -0.09825897216796875, -0.08487319946289062, -0.0714874267578125, -0.058101654052734375, -0.04471588134765625, -0.031330108642578125, -0.0179443359375, -0.004558563232421875, 0.00882720947265625, 0.022212982177734375, 0.0355987548828125, 0.048984527587890625, 0.06237030029296875, 0.07575607299804688, 0.089141845703125, 0.10252761840820312, 0.11591339111328125, 0.12929916381835938, 0.1426849365234375, 0.15607070922851562, 0.16945648193359375, 0.18284225463867188, 0.19622802734375, 0.20961380004882812, 0.22299957275390625, 0.23638534545898438, 0.2497711181640625, 0.2631568908691406, 0.27654266357421875, 0.2899284362792969, 0.303314208984375, 0.3166999816894531, 0.33008575439453125, 0.3434715270996094, 0.3568572998046875, 0.3702430725097656, 0.38362884521484375, 0.3970146179199219, 0.410400390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 13.0, 16.0, 9.0, 23.0, 35.0, 48.0, 59.0, 106.0, 132.0, 119.0, 113.0, 112.0, 46.0, 49.0, 31.0, 24.0, 13.0, 9.0, 12.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08391666412353516, -0.08085823059082031, -0.07779979705810547, -0.07474136352539062, -0.07168292999267578, -0.06862449645996094, -0.0655660629272461, -0.06250762939453125, -0.059449195861816406, -0.05639076232910156, -0.05333232879638672, -0.050273895263671875, -0.04721546173095703, -0.04415702819824219, -0.041098594665527344, -0.0380401611328125, -0.034981727600097656, -0.03192329406738281, -0.02886486053466797, -0.025806427001953125, -0.02274799346923828, -0.019689559936523438, -0.016631126403808594, -0.01357269287109375, -0.010514259338378906, -0.0074558258056640625, -0.004397392272949219, -0.001338958740234375, 0.0017194747924804688, 0.0047779083251953125, 0.007836341857910156, 0.010894775390625, 0.013953208923339844, 0.017011642456054688, 0.02007007598876953, 0.023128509521484375, 0.02618694305419922, 0.029245376586914062, 0.032303810119628906, 0.03536224365234375, 0.038420677185058594, 0.04147911071777344, 0.04453754425048828, 0.047595977783203125, 0.05065441131591797, 0.05371284484863281, 0.056771278381347656, 0.0598297119140625, 0.06288814544677734, 0.06594657897949219, 0.06900501251220703, 0.07206344604492188, 0.07512187957763672, 0.07818031311035156, 0.0812387466430664, 0.08429718017578125, 0.0873556137084961, 0.09041404724121094, 0.09347248077392578, 0.09653091430664062, 0.09958934783935547, 0.10264778137207031, 0.10570621490478516, 0.1087646484375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 13.0, 49.0, 112.0, 210.0, 264.0, 198.0, 92.0, 30.0, 11.0, 14.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.367982864379883, -2.284615993499756, -2.201249122619629, -2.117882251739502, -2.034515380859375, -1.951148509979248, -1.867781639099121, -1.7844147682189941, -1.7010478973388672, -1.6176810264587402, -1.5343141555786133, -1.4509472846984863, -1.3675804138183594, -1.2842135429382324, -1.2008466720581055, -1.1174798011779785, -1.0341129302978516, -0.9507460594177246, -0.8673791885375977, -0.7840123176574707, -0.7006454467773438, -0.6172785758972168, -0.5339117050170898, -0.4505448341369629, -0.36717796325683594, -0.283811092376709, -0.20044422149658203, -0.11707735061645508, -0.033710479736328125, 0.04965639114379883, 0.13302326202392578, 0.21639013290405273, 0.2997572422027588, 0.38312411308288574, 0.4664909839630127, 0.5498578548431396, 0.6332247257232666, 0.7165915966033936, 0.7999584674835205, 0.8833253383636475, 0.9666922092437744, 1.0500590801239014, 1.1334259510040283, 1.2167928218841553, 1.3001596927642822, 1.3835265636444092, 1.4668934345245361, 1.550260305404663, 1.63362717628479, 1.716994047164917, 1.800360918045044, 1.883727788925171, 1.9670946598052979, 2.050461530685425, 2.1338284015655518, 2.2171952724456787, 2.3005621433258057, 2.3839290142059326, 2.4672958850860596, 2.5506627559661865, 2.6340296268463135, 2.7173964977264404, 2.8007633686065674, 2.8841302394866943, 2.9674971103668213]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 13.0, 22.0, 21.0, 23.0, 32.0, 30.0, 34.0, 36.0, 31.0, 43.0, 46.0, 48.0, 51.0, 49.0, 48.0, 45.0, 42.0, 38.0, 34.0, 32.0, 31.0, 20.0, 15.0, 25.0, 21.0, 20.0, 18.0, 16.0, 16.0, 9.0, 13.0, 8.0, 3.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.428632140159607, -1.3868021965026855, -1.3449722528457642, -1.3031423091888428, -1.2613122463226318, -1.2194823026657104, -1.177652359008789, -1.1358224153518677, -1.0939924716949463, -1.052162528038025, -1.0103325843811035, -0.9685025811195374, -0.926672637462616, -0.8848426938056946, -0.8430126905441284, -0.801182746887207, -0.7593528032302856, -0.7175228595733643, -0.6756929159164429, -0.6338629126548767, -0.5920329689979553, -0.5502030253410339, -0.5083730220794678, -0.4665430784225464, -0.424713134765625, -0.3828831911087036, -0.34105321764945984, -0.29922324419021606, -0.2573933005332947, -0.2155633419752121, -0.17373338341712952, -0.13190340995788574, -0.0900733470916748, -0.048243388533592224, -0.0064134299755096436, 0.03541652858257294, 0.07724648714065552, 0.1190764456987381, 0.16090640425682068, 0.20273637771606445, 0.24456632137298584, 0.2863962650299072, 0.328226238489151, 0.3700562119483948, 0.41188615560531616, 0.45371609926223755, 0.4955460727214813, 0.5373760461807251, 0.5792059898376465, 0.6210359334945679, 0.6628658771514893, 0.7046958804130554, 0.7465258240699768, 0.7883557677268982, 0.8301857709884644, 0.8720157146453857, 0.9138456583023071, 0.9556756019592285, 0.9975055456161499, 1.0393354892730713, 1.0811655521392822, 1.1229954957962036, 1.164825439453125, 1.2066553831100464, 1.2484853267669678]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 2.0, 4.0, 10.0, 8.0, 13.0, 27.0, 30.0, 48.0, 84.0, 144.0, 240.0, 442.0, 1059.0, 2567.0, 8121.0, 52529.0, 1066541.0, 2839877.0, 197661.0, 18607.0, 3807.0, 1273.0, 542.0, 285.0, 118.0, 78.0, 63.0, 31.0, 24.0, 8.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8361358642578125, -0.807525634765625, -0.7789154052734375, -0.75030517578125, -0.7216949462890625, -0.693084716796875, -0.6644744873046875, -0.6358642578125, -0.6072540283203125, -0.578643798828125, -0.5500335693359375, -0.52142333984375, -0.4928131103515625, -0.464202880859375, -0.4355926513671875, -0.406982421875, -0.3783721923828125, -0.349761962890625, -0.3211517333984375, -0.29254150390625, -0.2639312744140625, -0.235321044921875, -0.2067108154296875, -0.1781005859375, -0.1494903564453125, -0.120880126953125, -0.0922698974609375, -0.06365966796875, -0.0350494384765625, -0.006439208984375, 0.0221710205078125, 0.05078125, 0.0793914794921875, 0.108001708984375, 0.1366119384765625, 0.16522216796875, 0.1938323974609375, 0.222442626953125, 0.2510528564453125, 0.2796630859375, 0.3082733154296875, 0.336883544921875, 0.3654937744140625, 0.39410400390625, 0.4227142333984375, 0.451324462890625, 0.4799346923828125, 0.508544921875, 0.5371551513671875, 0.565765380859375, 0.5943756103515625, 0.62298583984375, 0.6515960693359375, 0.680206298828125, 0.7088165283203125, 0.7374267578125, 0.7660369873046875, 0.794647216796875, 0.8232574462890625, 0.85186767578125, 0.8804779052734375, 0.909088134765625, 0.9376983642578125, 0.96630859375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 7.0, 9.0, 11.0, 26.0, 17.0, 31.0, 36.0, 54.0, 64.0, 75.0, 85.0, 95.0, 92.0, 80.0, 72.0, 60.0, 62.0, 27.0, 31.0, 18.0, 13.0, 8.0, 12.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.5959548950195312, -0.5727691650390625, -0.5495834350585938, -0.526397705078125, -0.5032119750976562, -0.4800262451171875, -0.45684051513671875, -0.43365478515625, -0.41046905517578125, -0.3872833251953125, -0.36409759521484375, -0.340911865234375, -0.31772613525390625, -0.2945404052734375, -0.27135467529296875, -0.2481689453125, -0.22498321533203125, -0.2017974853515625, -0.17861175537109375, -0.155426025390625, -0.13224029541015625, -0.1090545654296875, -0.08586883544921875, -0.06268310546875, -0.03949737548828125, -0.0163116455078125, 0.00687408447265625, 0.030059814453125, 0.05324554443359375, 0.0764312744140625, 0.09961700439453125, 0.122802734375, 0.14598846435546875, 0.1691741943359375, 0.19235992431640625, 0.215545654296875, 0.23873138427734375, 0.2619171142578125, 0.28510284423828125, 0.30828857421875, 0.33147430419921875, 0.3546600341796875, 0.37784576416015625, 0.401031494140625, 0.42421722412109375, 0.4474029541015625, 0.47058868408203125, 0.4937744140625, 0.5169601440429688, 0.5401458740234375, 0.5633316040039062, 0.586517333984375, 0.6097030639648438, 0.6328887939453125, 0.6560745239257812, 0.67926025390625, 0.7024459838867188, 0.7256317138671875, 0.7488174438476562, 0.772003173828125, 0.7951889038085938, 0.8183746337890625, 0.8415603637695312, 0.86474609375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 7.0, 12.0, 6.0, 16.0, 30.0, 19.0, 39.0, 75.0, 67.0, 129.0, 206.0, 363.0, 640.0, 1336.0, 2971.0, 9119.0, 42094.0, 519509.0, 3339824.0, 239489.0, 27361.0, 6542.0, 2205.0, 888.0, 465.0, 286.0, 182.0, 118.0, 77.0, 61.0, 37.0, 31.0, 25.0, 15.0, 9.0, 11.0, 4.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6953125, -0.6738357543945312, -0.6523590087890625, -0.6308822631835938, -0.609405517578125, -0.5879287719726562, -0.5664520263671875, -0.5449752807617188, -0.52349853515625, -0.5020217895507812, -0.4805450439453125, -0.45906829833984375, -0.437591552734375, -0.41611480712890625, -0.3946380615234375, -0.37316131591796875, -0.3516845703125, -0.33020782470703125, -0.3087310791015625, -0.28725433349609375, -0.265777587890625, -0.24430084228515625, -0.2228240966796875, -0.20134735107421875, -0.17987060546875, -0.15839385986328125, -0.1369171142578125, -0.11544036865234375, -0.093963623046875, -0.07248687744140625, -0.0510101318359375, -0.02953338623046875, -0.008056640625, 0.01342010498046875, 0.0348968505859375, 0.05637359619140625, 0.077850341796875, 0.09932708740234375, 0.1208038330078125, 0.14228057861328125, 0.16375732421875, 0.18523406982421875, 0.2067108154296875, 0.22818756103515625, 0.249664306640625, 0.27114105224609375, 0.2926177978515625, 0.31409454345703125, 0.3355712890625, 0.35704803466796875, 0.3785247802734375, 0.40000152587890625, 0.421478271484375, 0.44295501708984375, 0.4644317626953125, 0.48590850830078125, 0.50738525390625, 0.5288619995117188, 0.5503387451171875, 0.5718154907226562, 0.593292236328125, 0.6147689819335938, 0.6362457275390625, 0.6577224731445312, 0.67919921875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 6.0, 4.0, 13.0, 5.0, 16.0, 16.0, 15.0, 31.0, 38.0, 42.0, 62.0, 108.0, 123.0, 161.0, 237.0, 358.0, 455.0, 498.0, 462.0, 361.0, 297.0, 193.0, 163.0, 128.0, 71.0, 47.0, 48.0, 25.0, 18.0, 18.0, 13.0, 15.0, 5.0, 1.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.14599609375, -0.141387939453125, -0.13677978515625, -0.132171630859375, -0.1275634765625, -0.122955322265625, -0.11834716796875, -0.113739013671875, -0.109130859375, -0.104522705078125, -0.09991455078125, -0.095306396484375, -0.0906982421875, -0.086090087890625, -0.08148193359375, -0.076873779296875, -0.072265625, -0.067657470703125, -0.06304931640625, -0.058441162109375, -0.0538330078125, -0.049224853515625, -0.04461669921875, -0.040008544921875, -0.035400390625, -0.030792236328125, -0.02618408203125, -0.021575927734375, -0.0169677734375, -0.012359619140625, -0.00775146484375, -0.003143310546875, 0.00146484375, 0.006072998046875, 0.01068115234375, 0.015289306640625, 0.0198974609375, 0.024505615234375, 0.02911376953125, 0.033721923828125, 0.038330078125, 0.042938232421875, 0.04754638671875, 0.052154541015625, 0.0567626953125, 0.061370849609375, 0.06597900390625, 0.070587158203125, 0.0751953125, 0.079803466796875, 0.08441162109375, 0.089019775390625, 0.0936279296875, 0.098236083984375, 0.10284423828125, 0.107452392578125, 0.112060546875, 0.116668701171875, 0.12127685546875, 0.125885009765625, 0.1304931640625, 0.135101318359375, 0.13970947265625, 0.144317626953125, 0.14892578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 15.0, 36.0, 74.0, 169.0, 254.0, 231.0, 129.0, 53.0, 26.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5428178310394287, -2.4818809032440186, -2.4209437370300293, -2.360006809234619, -2.299069881439209, -2.238132953643799, -2.1771957874298096, -2.1162588596343994, -2.05532169342041, -1.9943846464157104, -1.9334477186203003, -1.8725106716156006, -1.8115737438201904, -1.7506366968154907, -1.689699649810791, -1.6287627220153809, -1.5678257942199707, -1.506888747215271, -1.4459518194198608, -1.3850147724151611, -1.324077844619751, -1.2631407976150513, -1.2022037506103516, -1.1412668228149414, -1.0803297758102417, -1.019392728805542, -0.9584558010101318, -0.8975187540054321, -0.8365817666053772, -0.7756447792053223, -0.7147077322006226, -0.6537707448005676, -0.5928338766098022, -0.5318968892097473, -0.47095987200737, -0.4100228548049927, -0.34908586740493774, -0.2881488800048828, -0.2272118628025055, -0.16627484560012817, -0.10533785820007324, -0.04440085589885712, 0.01653614640235901, 0.07747314870357513, 0.13841015100479126, 0.1993471384048462, 0.2602841556072235, 0.32122117280960083, 0.38215816020965576, 0.4430951476097107, 0.5040321350097656, 0.5649691820144653, 0.6259061694145203, 0.6868431568145752, 0.7477802038192749, 0.8087171912193298, 0.8696541786193848, 0.9305911660194397, 0.9915281534194946, 1.0524652004241943, 1.1134021282196045, 1.1743391752243042, 1.235276222229004, 1.296213150024414, 1.3571501970291138]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 2.0, 12.0, 5.0, 8.0, 11.0, 8.0, 11.0, 27.0, 18.0, 35.0, 42.0, 46.0, 44.0, 51.0, 69.0, 68.0, 57.0, 52.0, 71.0, 66.0, 34.0, 42.0, 45.0, 33.0, 33.0, 21.0, 26.0, 16.0, 17.0, 8.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5787622928619385, -0.560859739780426, -0.5429572463035583, -0.5250546932220459, -0.5071521997451782, -0.48924964666366577, -0.4713471233844757, -0.45344460010528564, -0.4355420768260956, -0.4176395535469055, -0.39973703026771545, -0.3818345069885254, -0.36393195390701294, -0.34602946043014526, -0.3281269073486328, -0.31022438406944275, -0.2923218607902527, -0.2744193375110626, -0.25651681423187256, -0.2386142760515213, -0.22071175277233124, -0.20280922949314117, -0.18490669131278992, -0.16700416803359985, -0.1491016447544098, -0.13119912147521973, -0.11329659074544907, -0.0953940600156784, -0.07749153673648834, -0.05958901345729828, -0.04168648272752762, -0.023783951997756958, -0.005881369113922119, 0.012021157890558243, 0.029923684895038605, 0.04782621189951897, 0.06572873890399933, 0.08363126218318939, 0.10153379291296005, 0.11943632364273071, 0.13733884692192078, 0.15524137020111084, 0.1731438934803009, 0.19104643166065216, 0.20894895493984222, 0.2268514782190323, 0.24475401639938354, 0.2626565396785736, 0.28055906295776367, 0.29846158623695374, 0.3163641095161438, 0.33426663279533386, 0.3521691560745239, 0.3700717091560364, 0.38797423243522644, 0.4058767557144165, 0.42377927899360657, 0.44168180227279663, 0.4595843255519867, 0.47748684883117676, 0.4953894019126892, 0.5132918953895569, 0.5311944484710693, 0.549096941947937, 0.5669994950294495]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 14.0, 22.0, 24.0, 48.0, 70.0, 97.0, 206.0, 343.0, 636.0, 1356.0, 3449.0, 10597.0, 43657.0, 214361.0, 500400.0, 213078.0, 43099.0, 10714.0, 3439.0, 1428.0, 629.0, 328.0, 197.0, 119.0, 76.0, 42.0, 28.0, 15.0, 14.0, 11.0, 7.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1339111328125, -0.12965965270996094, -0.12540817260742188, -0.12115669250488281, -0.11690521240234375, -0.11265373229980469, -0.10840225219726562, -0.10415077209472656, -0.0998992919921875, -0.09564781188964844, -0.09139633178710938, -0.08714485168457031, -0.08289337158203125, -0.07864189147949219, -0.07439041137695312, -0.07013893127441406, -0.065887451171875, -0.06163597106933594, -0.057384490966796875, -0.05313301086425781, -0.04888153076171875, -0.04463005065917969, -0.040378570556640625, -0.03612709045410156, -0.0318756103515625, -0.027624130249023438, -0.023372650146484375, -0.019121170043945312, -0.01486968994140625, -0.010618209838867188, -0.006366729736328125, -0.0021152496337890625, 0.00213623046875, 0.0063877105712890625, 0.010639190673828125, 0.014890670776367188, 0.01914215087890625, 0.023393630981445312, 0.027645111083984375, 0.03189659118652344, 0.0361480712890625, 0.04039955139160156, 0.044651031494140625, 0.04890251159667969, 0.05315399169921875, 0.05740547180175781, 0.061656951904296875, 0.06590843200683594, 0.070159912109375, 0.07441139221191406, 0.07866287231445312, 0.08291435241699219, 0.08716583251953125, 0.09141731262207031, 0.09566879272460938, 0.09992027282714844, 0.1041717529296875, 0.10842323303222656, 0.11267471313476562, 0.11692619323730469, 0.12117767333984375, 0.1254291534423828, 0.12968063354492188, 0.13393211364746094, 0.13818359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 9.0, 13.0, 15.0, 9.0, 21.0, 41.0, 57.0, 61.0, 79.0, 81.0, 94.0, 91.0, 67.0, 79.0, 64.0, 56.0, 34.0, 42.0, 19.0, 20.0, 10.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.517578125, -0.4997711181640625, -0.481964111328125, -0.4641571044921875, -0.44635009765625, -0.4285430908203125, -0.410736083984375, -0.3929290771484375, -0.3751220703125, -0.3573150634765625, -0.339508056640625, -0.3217010498046875, -0.30389404296875, -0.2860870361328125, -0.268280029296875, -0.2504730224609375, -0.232666015625, -0.2148590087890625, -0.197052001953125, -0.1792449951171875, -0.16143798828125, -0.1436309814453125, -0.125823974609375, -0.1080169677734375, -0.0902099609375, -0.0724029541015625, -0.054595947265625, -0.0367889404296875, -0.01898193359375, -0.0011749267578125, 0.016632080078125, 0.0344390869140625, 0.05224609375, 0.0700531005859375, 0.087860107421875, 0.1056671142578125, 0.12347412109375, 0.1412811279296875, 0.159088134765625, 0.1768951416015625, 0.1947021484375, 0.2125091552734375, 0.230316162109375, 0.2481231689453125, 0.26593017578125, 0.2837371826171875, 0.301544189453125, 0.3193511962890625, 0.337158203125, 0.3549652099609375, 0.372772216796875, 0.3905792236328125, 0.40838623046875, 0.4261932373046875, 0.444000244140625, 0.4618072509765625, 0.4796142578125, 0.4974212646484375, 0.515228271484375, 0.5330352783203125, 0.55084228515625, 0.5686492919921875, 0.586456298828125, 0.6042633056640625, 0.6220703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 10.0, 25.0, 25.0, 36.0, 40.0, 69.0, 104.0, 181.0, 228.0, 448.0, 800.0, 1497.0, 3080.0, 7404.0, 19631.0, 57645.0, 176319.0, 360270.0, 270348.0, 98368.0, 31649.0, 11263.0, 4570.0, 2058.0, 986.0, 569.0, 326.0, 215.0, 115.0, 89.0, 58.0, 38.0, 30.0, 25.0, 12.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08819580078125, -0.0853261947631836, -0.08245658874511719, -0.07958698272705078, -0.07671737670898438, -0.07384777069091797, -0.07097816467285156, -0.06810855865478516, -0.06523895263671875, -0.062369346618652344, -0.05949974060058594, -0.05663013458251953, -0.053760528564453125, -0.05089092254638672, -0.04802131652832031, -0.045151710510253906, -0.0422821044921875, -0.039412498474121094, -0.03654289245605469, -0.03367328643798828, -0.030803680419921875, -0.02793407440185547, -0.025064468383789062, -0.022194862365722656, -0.01932525634765625, -0.016455650329589844, -0.013586044311523438, -0.010716438293457031, -0.007846832275390625, -0.004977226257324219, -0.0021076202392578125, 0.0007619857788085938, 0.003631591796875, 0.006501197814941406, 0.009370803833007812, 0.012240409851074219, 0.015110015869140625, 0.01797962188720703, 0.020849227905273438, 0.023718833923339844, 0.02658843994140625, 0.029458045959472656, 0.03232765197753906, 0.03519725799560547, 0.038066864013671875, 0.04093647003173828, 0.04380607604980469, 0.046675682067871094, 0.0495452880859375, 0.052414894104003906, 0.05528450012207031, 0.05815410614013672, 0.061023712158203125, 0.06389331817626953, 0.06676292419433594, 0.06963253021240234, 0.07250213623046875, 0.07537174224853516, 0.07824134826660156, 0.08111095428466797, 0.08398056030273438, 0.08685016632080078, 0.08971977233886719, 0.0925893783569336, 0.095458984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 6.0, 8.0, 2.0, 10.0, 14.0, 11.0, 11.0, 12.0, 25.0, 24.0, 22.0, 32.0, 22.0, 46.0, 41.0, 31.0, 42.0, 37.0, 46.0, 43.0, 43.0, 44.0, 40.0, 44.0, 44.0, 33.0, 40.0, 40.0, 29.0, 18.0, 23.0, 19.0, 20.0, 11.0, 10.0, 14.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.64599609375, -0.6275711059570312, -0.6091461181640625, -0.5907211303710938, -0.572296142578125, -0.5538711547851562, -0.5354461669921875, -0.5170211791992188, -0.49859619140625, -0.48017120361328125, -0.4617462158203125, -0.44332122802734375, -0.424896240234375, -0.40647125244140625, -0.3880462646484375, -0.36962127685546875, -0.3511962890625, -0.33277130126953125, -0.3143463134765625, -0.29592132568359375, -0.277496337890625, -0.25907135009765625, -0.2406463623046875, -0.22222137451171875, -0.20379638671875, -0.18537139892578125, -0.1669464111328125, -0.14852142333984375, -0.130096435546875, -0.11167144775390625, -0.0932464599609375, -0.07482147216796875, -0.056396484375, -0.03797149658203125, -0.0195465087890625, -0.00112152099609375, 0.017303466796875, 0.03572845458984375, 0.0541534423828125, 0.07257843017578125, 0.09100341796875, 0.10942840576171875, 0.1278533935546875, 0.14627838134765625, 0.164703369140625, 0.18312835693359375, 0.2015533447265625, 0.21997833251953125, 0.2384033203125, 0.25682830810546875, 0.2752532958984375, 0.29367828369140625, 0.312103271484375, 0.33052825927734375, 0.3489532470703125, 0.36737823486328125, 0.38580322265625, 0.40422821044921875, 0.4226531982421875, 0.44107818603515625, 0.459503173828125, 0.47792816162109375, 0.4963531494140625, 0.5147781372070312, 0.533203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 4.0, 14.0, 26.0, 37.0, 61.0, 79.0, 131.0, 228.0, 411.0, 740.0, 1732.0, 4352.0, 14771.0, 75856.0, 383523.0, 441120.0, 97870.0, 18405.0, 5121.0, 2052.0, 914.0, 421.0, 281.0, 139.0, 83.0, 53.0, 36.0, 22.0, 14.0, 10.0, 10.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034454345703125, -0.033226966857910156, -0.03199958801269531, -0.03077220916748047, -0.029544830322265625, -0.02831745147705078, -0.027090072631835938, -0.025862693786621094, -0.02463531494140625, -0.023407936096191406, -0.022180557250976562, -0.02095317840576172, -0.019725799560546875, -0.01849842071533203, -0.017271041870117188, -0.016043663024902344, -0.0148162841796875, -0.013588905334472656, -0.012361526489257812, -0.011134147644042969, -0.009906768798828125, -0.008679389953613281, -0.0074520111083984375, -0.006224632263183594, -0.00499725341796875, -0.0037698745727539062, -0.0025424957275390625, -0.0013151168823242188, -8.7738037109375e-05, 0.0011396408081054688, 0.0023670196533203125, 0.0035943984985351562, 0.00482177734375, 0.006049156188964844, 0.0072765350341796875, 0.008503913879394531, 0.009731292724609375, 0.010958671569824219, 0.012186050415039062, 0.013413429260253906, 0.01464080810546875, 0.015868186950683594, 0.017095565795898438, 0.01832294464111328, 0.019550323486328125, 0.02077770233154297, 0.022005081176757812, 0.023232460021972656, 0.0244598388671875, 0.025687217712402344, 0.026914596557617188, 0.02814197540283203, 0.029369354248046875, 0.03059673309326172, 0.03182411193847656, 0.033051490783691406, 0.03427886962890625, 0.035506248474121094, 0.03673362731933594, 0.03796100616455078, 0.039188385009765625, 0.04041576385498047, 0.04164314270019531, 0.042870521545410156, 0.044097900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 0.0, 4.0, 7.0, 7.0, 12.0, 13.0, 13.0, 19.0, 30.0, 33.0, 62.0, 44.0, 54.0, 83.0, 103.0, 84.0, 86.0, 71.0, 74.0, 50.0, 37.0, 22.0, 22.0, 21.0, 16.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4194287359714508e-05, -1.3725832104682922e-05, -1.3257376849651337e-05, -1.2788921594619751e-05, -1.2320466339588165e-05, -1.185201108455658e-05, -1.1383555829524994e-05, -1.0915100574493408e-05, -1.0446645319461823e-05, -9.978190064430237e-06, -9.509734809398651e-06, -9.041279554367065e-06, -8.57282429933548e-06, -8.104369044303894e-06, -7.635913789272308e-06, -7.167458534240723e-06, -6.699003279209137e-06, -6.230548024177551e-06, -5.7620927691459656e-06, -5.29363751411438e-06, -4.825182259082794e-06, -4.3567270040512085e-06, -3.888271749019623e-06, -3.419816493988037e-06, -2.9513612389564514e-06, -2.4829059839248657e-06, -2.01445072889328e-06, -1.5459954738616943e-06, -1.0775402188301086e-06, -6.09084963798523e-07, -1.4062970876693726e-07, 3.2782554626464844e-07, 7.962808012962341e-07, 1.2647360563278198e-06, 1.7331913113594055e-06, 2.201646566390991e-06, 2.670101821422577e-06, 3.1385570764541626e-06, 3.6070123314857483e-06, 4.075467586517334e-06, 4.54392284154892e-06, 5.012378096580505e-06, 5.480833351612091e-06, 5.949288606643677e-06, 6.4177438616752625e-06, 6.886199116706848e-06, 7.354654371738434e-06, 7.82310962677002e-06, 8.291564881801605e-06, 8.760020136833191e-06, 9.228475391864777e-06, 9.696930646896362e-06, 1.0165385901927948e-05, 1.0633841156959534e-05, 1.110229641199112e-05, 1.1570751667022705e-05, 1.203920692205429e-05, 1.2507662177085876e-05, 1.2976117432117462e-05, 1.3444572687149048e-05, 1.3913027942180634e-05, 1.438148319721222e-05, 1.4849938452243805e-05, 1.531839370727539e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 7.0, 11.0, 7.0, 11.0, 13.0, 19.0, 26.0, 26.0, 38.0, 60.0, 116.0, 160.0, 270.0, 462.0, 842.0, 1974.0, 5439.0, 17122.0, 58764.0, 189612.0, 371358.0, 268750.0, 92770.0, 26813.0, 8316.0, 2893.0, 1153.0, 603.0, 310.0, 191.0, 121.0, 90.0, 60.0, 42.0, 30.0, 27.0, 12.0, 16.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0235595703125, -0.022708654403686523, -0.021857738494873047, -0.02100682258605957, -0.020155906677246094, -0.019304990768432617, -0.01845407485961914, -0.017603158950805664, -0.016752243041992188, -0.01590132713317871, -0.015050411224365234, -0.014199495315551758, -0.013348579406738281, -0.012497663497924805, -0.011646747589111328, -0.010795831680297852, -0.009944915771484375, -0.009093999862670898, -0.008243083953857422, -0.007392168045043945, -0.006541252136230469, -0.005690336227416992, -0.004839420318603516, -0.003988504409790039, -0.0031375885009765625, -0.002286672592163086, -0.0014357566833496094, -0.0005848407745361328, 0.00026607513427734375, 0.0011169910430908203, 0.001967906951904297, 0.0028188228607177734, 0.00366973876953125, 0.0045206546783447266, 0.005371570587158203, 0.00622248649597168, 0.007073402404785156, 0.007924318313598633, 0.00877523422241211, 0.009626150131225586, 0.010477066040039062, 0.011327981948852539, 0.012178897857666016, 0.013029813766479492, 0.013880729675292969, 0.014731645584106445, 0.015582561492919922, 0.0164334774017334, 0.017284393310546875, 0.01813530921936035, 0.018986225128173828, 0.019837141036987305, 0.02068805694580078, 0.021538972854614258, 0.022389888763427734, 0.02324080467224121, 0.024091720581054688, 0.024942636489868164, 0.02579355239868164, 0.026644468307495117, 0.027495384216308594, 0.02834630012512207, 0.029197216033935547, 0.030048131942749023, 0.0308990478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 6.0, 15.0, 9.0, 18.0, 14.0, 15.0, 19.0, 27.0, 27.0, 34.0, 40.0, 40.0, 35.0, 44.0, 55.0, 46.0, 51.0, 32.0, 43.0, 49.0, 43.0, 52.0, 39.0, 38.0, 30.0, 36.0, 14.0, 22.0, 11.0, 11.0, 15.0, 13.0, 5.0, 10.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.00684356689453125, -0.006635427474975586, -0.006427288055419922, -0.006219148635864258, -0.006011009216308594, -0.00580286979675293, -0.005594730377197266, -0.0053865909576416016, -0.0051784515380859375, -0.0049703121185302734, -0.004762172698974609, -0.004554033279418945, -0.004345893859863281, -0.004137754440307617, -0.003929615020751953, -0.003721475601196289, -0.003513336181640625, -0.003305196762084961, -0.003097057342529297, -0.002888917922973633, -0.0026807785034179688, -0.0024726390838623047, -0.0022644996643066406, -0.0020563602447509766, -0.0018482208251953125, -0.0016400814056396484, -0.0014319419860839844, -0.0012238025665283203, -0.0010156631469726562, -0.0008075237274169922, -0.0005993843078613281, -0.00039124488830566406, -0.00018310546875, 2.5033950805664062e-05, 0.00023317337036132812, 0.0004413127899169922, 0.0006494522094726562, 0.0008575916290283203, 0.0010657310485839844, 0.0012738704681396484, 0.0014820098876953125, 0.0016901493072509766, 0.0018982887268066406, 0.0021064281463623047, 0.0023145675659179688, 0.002522706985473633, 0.002730846405029297, 0.002938985824584961, 0.003147125244140625, 0.003355264663696289, 0.003563404083251953, 0.003771543502807617, 0.003979682922363281, 0.004187822341918945, 0.004395961761474609, 0.0046041011810302734, 0.0048122406005859375, 0.0050203800201416016, 0.005228519439697266, 0.00543665885925293, 0.005644798278808594, 0.005852937698364258, 0.006061077117919922, 0.006269216537475586, 0.00647735595703125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 106.0, 719.0, 169.0, 15.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54862117767334, -6.416533470153809, -6.284445762634277, -6.152358531951904, -6.020270824432373, -5.888183116912842, -5.7560954093933105, -5.6240081787109375, -5.491920471191406, -5.359832763671875, -5.227745056152344, -5.095657825469971, -4.9635701179504395, -4.831482410430908, -4.699394702911377, -4.567307472229004, -4.435219764709473, -4.303132057189941, -4.17104434967041, -4.038957118988037, -3.906869411468506, -3.7747817039489746, -3.6426939964294434, -3.510606527328491, -3.378518581390381, -3.2464308738708496, -3.1143434047698975, -2.982255697250366, -2.850168228149414, -2.718080520629883, -2.5859928131103516, -2.4539053440093994, -2.321817398071289, -2.189729690551758, -2.0576422214508057, -1.9255545139312744, -1.7934670448303223, -1.661379337310791, -1.5292917490005493, -1.3972041606903076, -1.2651166915893555, -1.1330291032791138, -1.000941514968872, -0.8688538670539856, -0.7367662787437439, -0.6046786904335022, -0.4725910425186157, -0.340503454208374, -0.20841586589813232, -0.07632826268672943, 0.05575934052467346, 0.18784695863723755, 0.31993454694747925, 0.45202213525772095, 0.5841097831726074, 0.7161973714828491, 0.8482849597930908, 0.9803725481033325, 1.1124601364135742, 1.2445478439331055, 1.3766353130340576, 1.5087230205535889, 1.6408106088638306, 1.7728981971740723, 1.904985785484314]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 12.0, 6.0, 16.0, 9.0, 15.0, 20.0, 31.0, 44.0, 65.0, 59.0, 73.0, 95.0, 77.0, 76.0, 77.0, 65.0, 51.0, 57.0, 32.0, 35.0, 31.0, 17.0, 15.0, 10.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4810790717601776, -0.4649052023887634, -0.44873133301734924, -0.43255746364593506, -0.4163835644721985, -0.4002097249031067, -0.3840358257293701, -0.36786195635795593, -0.35168808698654175, -0.33551421761512756, -0.3193403482437134, -0.3031664788722992, -0.286992609500885, -0.27081871032714844, -0.25464484095573425, -0.23847097158432007, -0.22229710221290588, -0.2061232328414917, -0.18994936347007751, -0.17377547919750214, -0.15760160982608795, -0.14142774045467377, -0.1252538561820984, -0.1090799868106842, -0.09290611743927002, -0.07673224806785583, -0.06055837124586105, -0.04438449814915657, -0.028210625052452087, -0.012036755681037903, 0.004137121140956879, 0.02031099796295166, 0.03648489713668823, 0.052658770233392715, 0.0688326433300972, 0.08500652015209198, 0.10118038952350616, 0.11735425889492035, 0.13352814316749573, 0.1497020125389099, 0.1658758819103241, 0.18204975128173828, 0.19822362065315247, 0.21439750492572784, 0.23057137429714203, 0.2467452436685562, 0.2629191279411316, 0.2790929973125458, 0.29526686668395996, 0.31144073605537415, 0.32761460542678833, 0.3437884747982025, 0.3599623441696167, 0.37613624334335327, 0.39231011271476746, 0.40848398208618164, 0.4246578514575958, 0.44083172082901, 0.4570055902004242, 0.4731794595718384, 0.48935335874557495, 0.5055271983146667, 0.5217010974884033, 0.5378749370574951, 0.5540488362312317]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 6.0, 12.0, 17.0, 11.0, 39.0, 39.0, 45.0, 83.0, 124.0, 193.0, 335.0, 493.0, 907.0, 1525.0, 2758.0, 5138.0, 10086.0, 21885.0, 52350.0, 137776.0, 382266.0, 267578.0, 94268.0, 37244.0, 16279.0, 7647.0, 4067.0, 2168.0, 1267.0, 738.0, 422.0, 305.0, 156.0, 122.0, 64.0, 54.0, 20.0, 24.0, 14.0, 8.0, 5.0, 11.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.18994140625, -0.18377685546875, -0.1776123046875, -0.17144775390625, -0.165283203125, -0.15911865234375, -0.1529541015625, -0.14678955078125, -0.140625, -0.13446044921875, -0.1282958984375, -0.12213134765625, -0.115966796875, -0.10980224609375, -0.1036376953125, -0.09747314453125, -0.09130859375, -0.08514404296875, -0.0789794921875, -0.07281494140625, -0.066650390625, -0.06048583984375, -0.0543212890625, -0.04815673828125, -0.0419921875, -0.03582763671875, -0.0296630859375, -0.02349853515625, -0.017333984375, -0.01116943359375, -0.0050048828125, 0.00115966796875, 0.00732421875, 0.01348876953125, 0.0196533203125, 0.02581787109375, 0.031982421875, 0.03814697265625, 0.0443115234375, 0.05047607421875, 0.056640625, 0.06280517578125, 0.0689697265625, 0.07513427734375, 0.081298828125, 0.08746337890625, 0.0936279296875, 0.09979248046875, 0.10595703125, 0.11212158203125, 0.1182861328125, 0.12445068359375, 0.130615234375, 0.13677978515625, 0.1429443359375, 0.14910888671875, 0.1552734375, 0.16143798828125, 0.1676025390625, 0.17376708984375, 0.179931640625, 0.18609619140625, 0.1922607421875, 0.19842529296875, 0.20458984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 14.0, 3.0, 8.0, 14.0, 11.0, 16.0, 20.0, 32.0, 52.0, 45.0, 63.0, 43.0, 61.0, 71.0, 75.0, 69.0, 65.0, 52.0, 57.0, 34.0, 41.0, 31.0, 33.0, 13.0, 19.0, 11.0, 19.0, 5.0, 9.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96044921875, -0.9340896606445312, -0.9077301025390625, -0.8813705444335938, -0.855010986328125, -0.8286514282226562, -0.8022918701171875, -0.7759323120117188, -0.74957275390625, -0.7232131958007812, -0.6968536376953125, -0.6704940795898438, -0.644134521484375, -0.6177749633789062, -0.5914154052734375, -0.5650558471679688, -0.5386962890625, -0.5123367309570312, -0.4859771728515625, -0.45961761474609375, -0.433258056640625, -0.40689849853515625, -0.3805389404296875, -0.35417938232421875, -0.32781982421875, -0.30146026611328125, -0.2751007080078125, -0.24874114990234375, -0.222381591796875, -0.19602203369140625, -0.1696624755859375, -0.14330291748046875, -0.116943359375, -0.09058380126953125, -0.0642242431640625, -0.03786468505859375, -0.011505126953125, 0.01485443115234375, 0.0412139892578125, 0.06757354736328125, 0.09393310546875, 0.12029266357421875, 0.1466522216796875, 0.17301177978515625, 0.199371337890625, 0.22573089599609375, 0.2520904541015625, 0.27845001220703125, 0.3048095703125, 0.33116912841796875, 0.3575286865234375, 0.38388824462890625, 0.410247802734375, 0.43660736083984375, 0.4629669189453125, 0.48932647705078125, 0.51568603515625, 0.5420455932617188, 0.5684051513671875, 0.5947647094726562, 0.621124267578125, 0.6474838256835938, 0.6738433837890625, 0.7002029418945312, 0.7265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 9.0, 10.0, 22.0, 29.0, 30.0, 64.0, 100.0, 142.0, 257.0, 532.0, 1692.0, 11559.0, 394254.0, 621080.0, 15446.0, 1968.0, 578.0, 304.0, 154.0, 95.0, 62.0, 42.0, 26.0, 27.0, 9.0, 10.0, 10.0, 8.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.671875, -0.6487503051757812, -0.6256256103515625, -0.6025009155273438, -0.579376220703125, -0.5562515258789062, -0.5331268310546875, -0.5100021362304688, -0.48687744140625, -0.46375274658203125, -0.4406280517578125, -0.41750335693359375, -0.394378662109375, -0.37125396728515625, -0.3481292724609375, -0.32500457763671875, -0.3018798828125, -0.27875518798828125, -0.2556304931640625, -0.23250579833984375, -0.209381103515625, -0.18625640869140625, -0.1631317138671875, -0.14000701904296875, -0.11688232421875, -0.09375762939453125, -0.0706329345703125, -0.04750823974609375, -0.024383544921875, -0.00125885009765625, 0.0218658447265625, 0.04499053955078125, 0.068115234375, 0.09123992919921875, 0.1143646240234375, 0.13748931884765625, 0.160614013671875, 0.18373870849609375, 0.2068634033203125, 0.22998809814453125, 0.25311279296875, 0.27623748779296875, 0.2993621826171875, 0.32248687744140625, 0.345611572265625, 0.36873626708984375, 0.3918609619140625, 0.41498565673828125, 0.4381103515625, 0.46123504638671875, 0.4843597412109375, 0.5074844360351562, 0.530609130859375, 0.5537338256835938, 0.5768585205078125, 0.5999832153320312, 0.62310791015625, 0.6462326049804688, 0.6693572998046875, 0.6924819946289062, 0.715606689453125, 0.7387313842773438, 0.7618560791015625, 0.7849807739257812, 0.80810546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 15.0, 17.0, 19.0, 17.0, 34.0, 26.0, 33.0, 47.0, 31.0, 41.0, 56.0, 56.0, 48.0, 63.0, 55.0, 54.0, 56.0, 45.0, 47.0, 33.0, 34.0, 24.0, 22.0, 19.0, 23.0, 15.0, 11.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8916015625, -0.8628463745117188, -0.8340911865234375, -0.8053359985351562, -0.776580810546875, -0.7478256225585938, -0.7190704345703125, -0.6903152465820312, -0.66156005859375, -0.6328048706054688, -0.6040496826171875, -0.5752944946289062, -0.546539306640625, -0.5177841186523438, -0.4890289306640625, -0.46027374267578125, -0.4315185546875, -0.40276336669921875, -0.3740081787109375, -0.34525299072265625, -0.316497802734375, -0.28774261474609375, -0.2589874267578125, -0.23023223876953125, -0.20147705078125, -0.17272186279296875, -0.1439666748046875, -0.11521148681640625, -0.086456298828125, -0.05770111083984375, -0.0289459228515625, -0.00019073486328125, 0.028564453125, 0.05731964111328125, 0.0860748291015625, 0.11483001708984375, 0.143585205078125, 0.17234039306640625, 0.2010955810546875, 0.22985076904296875, 0.25860595703125, 0.28736114501953125, 0.3161163330078125, 0.34487152099609375, 0.373626708984375, 0.40238189697265625, 0.4311370849609375, 0.45989227294921875, 0.4886474609375, 0.5174026489257812, 0.5461578369140625, 0.5749130249023438, 0.603668212890625, 0.6324234008789062, 0.6611785888671875, 0.6899337768554688, 0.71868896484375, 0.7474441528320312, 0.7761993408203125, 0.8049545288085938, 0.833709716796875, 0.8624649047851562, 0.8912200927734375, 0.9199752807617188, 0.94873046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 18.0, 12.0, 37.0, 61.0, 117.0, 280.0, 808.0, 3246.0, 32019.0, 965345.0, 41529.0, 3597.0, 867.0, 285.0, 146.0, 59.0, 36.0, 24.0, 21.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3145599365234375, -0.302703857421875, -0.2908477783203125, -0.27899169921875, -0.2671356201171875, -0.255279541015625, -0.2434234619140625, -0.2315673828125, -0.2197113037109375, -0.207855224609375, -0.1959991455078125, -0.18414306640625, -0.1722869873046875, -0.160430908203125, -0.1485748291015625, -0.13671875, -0.1248626708984375, -0.113006591796875, -0.1011505126953125, -0.08929443359375, -0.0774383544921875, -0.065582275390625, -0.0537261962890625, -0.0418701171875, -0.0300140380859375, -0.018157958984375, -0.0063018798828125, 0.00555419921875, 0.0174102783203125, 0.029266357421875, 0.0411224365234375, 0.052978515625, 0.0648345947265625, 0.076690673828125, 0.0885467529296875, 0.10040283203125, 0.1122589111328125, 0.124114990234375, 0.1359710693359375, 0.1478271484375, 0.1596832275390625, 0.171539306640625, 0.1833953857421875, 0.19525146484375, 0.2071075439453125, 0.218963623046875, 0.2308197021484375, 0.24267578125, 0.2545318603515625, 0.266387939453125, 0.2782440185546875, 0.29010009765625, 0.3019561767578125, 0.313812255859375, 0.3256683349609375, 0.3375244140625, 0.3493804931640625, 0.361236572265625, 0.3730926513671875, 0.38494873046875, 0.3968048095703125, 0.408660888671875, 0.4205169677734375, 0.432373046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 1.0, 1.0, 7.0, 11.0, 11.0, 20.0, 39.0, 46.0, 67.0, 83.0, 152.0, 182.0, 114.0, 80.0, 60.0, 37.0, 42.0, 18.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.641843795776367e-05, -3.54154035449028e-05, -3.441236913204193e-05, -3.340933471918106e-05, -3.240630030632019e-05, -3.140326589345932e-05, -3.040023148059845e-05, -2.939719706773758e-05, -2.839416265487671e-05, -2.739112824201584e-05, -2.6388093829154968e-05, -2.5385059416294098e-05, -2.4382025003433228e-05, -2.3378990590572357e-05, -2.2375956177711487e-05, -2.1372921764850616e-05, -2.0369887351989746e-05, -1.9366852939128876e-05, -1.8363818526268005e-05, -1.7360784113407135e-05, -1.6357749700546265e-05, -1.5354715287685394e-05, -1.4351680874824524e-05, -1.3348646461963654e-05, -1.2345612049102783e-05, -1.1342577636241913e-05, -1.0339543223381042e-05, -9.336508810520172e-06, -8.333474397659302e-06, -7.330439984798431e-06, -6.327405571937561e-06, -5.324371159076691e-06, -4.32133674621582e-06, -3.31830233335495e-06, -2.3152679204940796e-06, -1.3122335076332092e-06, -3.0919909477233887e-07, 6.938353180885315e-07, 1.6968697309494019e-06, 2.6999041438102722e-06, 3.7029385566711426e-06, 4.705972969532013e-06, 5.709007382392883e-06, 6.712041795253754e-06, 7.715076208114624e-06, 8.718110620975494e-06, 9.721145033836365e-06, 1.0724179446697235e-05, 1.1727213859558105e-05, 1.2730248272418976e-05, 1.3733282685279846e-05, 1.4736317098140717e-05, 1.5739351511001587e-05, 1.6742385923862457e-05, 1.7745420336723328e-05, 1.8748454749584198e-05, 1.975148916244507e-05, 2.075452357530594e-05, 2.175755798816681e-05, 2.276059240102768e-05, 2.376362681388855e-05, 2.476666122674942e-05, 2.576969563961029e-05, 2.677273005247116e-05, 2.777576446533203e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 13.0, 15.0, 37.0, 46.0, 86.0, 199.0, 539.0, 1769.0, 9284.0, 318171.0, 701829.0, 13194.0, 2270.0, 579.0, 238.0, 102.0, 50.0, 37.0, 18.0, 23.0, 8.0, 10.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.311767578125, -0.30025482177734375, -0.2887420654296875, -0.27722930908203125, -0.265716552734375, -0.25420379638671875, -0.2426910400390625, -0.23117828369140625, -0.21966552734375, -0.20815277099609375, -0.1966400146484375, -0.18512725830078125, -0.173614501953125, -0.16210174560546875, -0.1505889892578125, -0.13907623291015625, -0.1275634765625, -0.11605072021484375, -0.1045379638671875, -0.09302520751953125, -0.081512451171875, -0.06999969482421875, -0.0584869384765625, -0.04697418212890625, -0.03546142578125, -0.02394866943359375, -0.0124359130859375, -0.00092315673828125, 0.010589599609375, 0.02210235595703125, 0.0336151123046875, 0.04512786865234375, 0.056640625, 0.06815338134765625, 0.0796661376953125, 0.09117889404296875, 0.102691650390625, 0.11420440673828125, 0.1257171630859375, 0.13722991943359375, 0.14874267578125, 0.16025543212890625, 0.1717681884765625, 0.18328094482421875, 0.194793701171875, 0.20630645751953125, 0.2178192138671875, 0.22933197021484375, 0.2408447265625, 0.25235748291015625, 0.2638702392578125, 0.27538299560546875, 0.286895751953125, 0.29840850830078125, 0.3099212646484375, 0.32143402099609375, 0.33294677734375, 0.34445953369140625, 0.3559722900390625, 0.36748504638671875, 0.378997802734375, 0.39051055908203125, 0.4020233154296875, 0.41353607177734375, 0.425048828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 0.0, 7.0, 6.0, 7.0, 10.0, 19.0, 20.0, 37.0, 49.0, 84.0, 101.0, 153.0, 145.0, 97.0, 78.0, 51.0, 29.0, 30.0, 13.0, 14.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.08868408203125, -0.08635950088500977, -0.08403491973876953, -0.0817103385925293, -0.07938575744628906, -0.07706117630004883, -0.0747365951538086, -0.07241201400756836, -0.07008743286132812, -0.06776285171508789, -0.06543827056884766, -0.06311368942260742, -0.06078910827636719, -0.05846452713012695, -0.05613994598388672, -0.053815364837646484, -0.05149078369140625, -0.049166202545166016, -0.04684162139892578, -0.04451704025268555, -0.04219245910644531, -0.03986787796020508, -0.037543296813964844, -0.03521871566772461, -0.032894134521484375, -0.03056955337524414, -0.028244972229003906, -0.025920391082763672, -0.023595809936523438, -0.021271228790283203, -0.01894664764404297, -0.016622066497802734, -0.0142974853515625, -0.011972904205322266, -0.009648323059082031, -0.007323741912841797, -0.0049991607666015625, -0.002674579620361328, -0.00034999847412109375, 0.0019745826721191406, 0.004299163818359375, 0.006623744964599609, 0.008948326110839844, 0.011272907257080078, 0.013597488403320312, 0.015922069549560547, 0.01824665069580078, 0.020571231842041016, 0.02289581298828125, 0.025220394134521484, 0.02754497528076172, 0.029869556427001953, 0.03219413757324219, 0.03451871871948242, 0.036843299865722656, 0.03916788101196289, 0.041492462158203125, 0.04381704330444336, 0.046141624450683594, 0.04846620559692383, 0.05079078674316406, 0.0531153678894043, 0.05543994903564453, 0.057764530181884766, 0.060089111328125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 42.0, 87.0, 214.0, 291.0, 213.0, 77.0, 34.0, 16.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.911703586578369, -2.8270459175109863, -2.7423884868621826, -2.6577308177948, -2.573073387145996, -2.4884157180786133, -2.4037580490112305, -2.3191003799438477, -2.234442949295044, -2.149785280227661, -2.0651278495788574, -1.9804701805114746, -1.8958126306533813, -1.811155080795288, -1.7264974117279053, -1.641839861869812, -1.5571823120117188, -1.4725247621536255, -1.3878672122955322, -1.3032095432281494, -1.2185519933700562, -1.133894443511963, -1.04923677444458, -0.9645792245864868, -0.8799216747283936, -0.7952641248703003, -0.7106065154075623, -0.6259489059448242, -0.541291356086731, -0.4566337764263153, -0.37197619676589966, -0.2873185873031616, -0.20266127586364746, -0.11800369620323181, -0.03334611654281616, 0.05131146311759949, 0.13596904277801514, 0.2206266224384308, 0.30528420209884644, 0.3899418115615845, 0.47459936141967773, 0.559256911277771, 0.643914520740509, 0.7285721302032471, 0.8132296800613403, 0.8978872299194336, 0.9825448393821716, 1.0672024488449097, 1.151859998703003, 1.2365175485610962, 1.3211750984191895, 1.4058327674865723, 1.4904903173446655, 1.5751478672027588, 1.6598055362701416, 1.7444630861282349, 1.8291206359863281, 1.9137781858444214, 1.9984357357025146, 2.0830934047698975, 2.167750835418701, 2.252408504486084, 2.337066173553467, 2.4217238426208496, 2.5063812732696533]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 5.0, 8.0, 10.0, 15.0, 12.0, 15.0, 21.0, 16.0, 23.0, 29.0, 27.0, 28.0, 33.0, 38.0, 45.0, 44.0, 45.0, 60.0, 42.0, 43.0, 45.0, 36.0, 42.0, 37.0, 38.0, 36.0, 35.0, 28.0, 24.0, 27.0, 24.0, 15.0, 8.0, 8.0, 6.0, 13.0, 12.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16165292263031, -1.122979760169983, -1.0843065977096558, -1.0456334352493286, -1.0069602727890015, -0.9682871103286743, -0.9296139478683472, -0.89094078540802, -0.8522676229476929, -0.8135944604873657, -0.7749212980270386, -0.7362481355667114, -0.6975749731063843, -0.6589018106460571, -0.62022864818573, -0.5815554857254028, -0.5428823232650757, -0.5042091608047485, -0.4655359983444214, -0.42686283588409424, -0.3881896734237671, -0.34951651096343994, -0.3108433485031128, -0.27217018604278564, -0.2334970235824585, -0.19482386112213135, -0.1561506986618042, -0.11747753620147705, -0.0788043737411499, -0.040131211280822754, -0.0014580488204956055, 0.03721511363983154, 0.07588815689086914, 0.11456131935119629, 0.15323448181152344, 0.19190764427185059, 0.23058080673217773, 0.2692539691925049, 0.30792713165283203, 0.3466002941131592, 0.38527345657348633, 0.4239466190338135, 0.4626197814941406, 0.5012929439544678, 0.5399661064147949, 0.5786392688751221, 0.6173124313354492, 0.6559855937957764, 0.6946587562561035, 0.7333319187164307, 0.7720050811767578, 0.810678243637085, 0.8493514060974121, 0.8880245685577393, 0.9266977310180664, 0.9653708934783936, 1.0040440559387207, 1.0427172183990479, 1.081390380859375, 1.1200635433197021, 1.1587367057800293, 1.1974098682403564, 1.2360830307006836, 1.2747561931610107, 1.313429355621338]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 7.0, 12.0, 13.0, 24.0, 31.0, 46.0, 69.0, 114.0, 245.0, 548.0, 1382.0, 4678.0, 36943.0, 2250496.0, 1856220.0, 36526.0, 4608.0, 1228.0, 544.0, 250.0, 128.0, 59.0, 37.0, 24.0, 15.0, 18.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.724609375, -1.6862640380859375, -1.647918701171875, -1.6095733642578125, -1.57122802734375, -1.5328826904296875, -1.494537353515625, -1.4561920166015625, -1.4178466796875, -1.3795013427734375, -1.341156005859375, -1.3028106689453125, -1.26446533203125, -1.2261199951171875, -1.187774658203125, -1.1494293212890625, -1.111083984375, -1.0727386474609375, -1.034393310546875, -0.9960479736328125, -0.95770263671875, -0.9193572998046875, -0.881011962890625, -0.8426666259765625, -0.8043212890625, -0.7659759521484375, -0.727630615234375, -0.6892852783203125, -0.65093994140625, -0.6125946044921875, -0.574249267578125, -0.5359039306640625, -0.49755859375, -0.4592132568359375, -0.420867919921875, -0.3825225830078125, -0.34417724609375, -0.3058319091796875, -0.267486572265625, -0.2291412353515625, -0.1907958984375, -0.1524505615234375, -0.114105224609375, -0.0757598876953125, -0.03741455078125, 0.0009307861328125, 0.039276123046875, 0.0776214599609375, 0.115966796875, 0.1543121337890625, 0.192657470703125, 0.2310028076171875, 0.26934814453125, 0.3076934814453125, 0.346038818359375, 0.3843841552734375, 0.4227294921875, 0.4610748291015625, 0.499420166015625, 0.5377655029296875, 0.57611083984375, 0.6144561767578125, 0.652801513671875, 0.6911468505859375, 0.7294921875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 19.0, 19.0, 26.0, 24.0, 48.0, 46.0, 58.0, 57.0, 72.0, 77.0, 67.0, 77.0, 64.0, 72.0, 46.0, 43.0, 48.0, 23.0, 22.0, 16.0, 17.0, 17.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5518035888671875, -0.534759521484375, -0.5177154541015625, -0.50067138671875, -0.4836273193359375, -0.466583251953125, -0.4495391845703125, -0.4324951171875, -0.4154510498046875, -0.398406982421875, -0.3813629150390625, -0.36431884765625, -0.3472747802734375, -0.330230712890625, -0.3131866455078125, -0.296142578125, -0.2790985107421875, -0.262054443359375, -0.2450103759765625, -0.22796630859375, -0.2109222412109375, -0.193878173828125, -0.1768341064453125, -0.1597900390625, -0.1427459716796875, -0.125701904296875, -0.1086578369140625, -0.09161376953125, -0.0745697021484375, -0.057525634765625, -0.0404815673828125, -0.0234375, -0.0063934326171875, 0.010650634765625, 0.0276947021484375, 0.04473876953125, 0.0617828369140625, 0.078826904296875, 0.0958709716796875, 0.1129150390625, 0.1299591064453125, 0.147003173828125, 0.1640472412109375, 0.18109130859375, 0.1981353759765625, 0.215179443359375, 0.2322235107421875, 0.249267578125, 0.2663116455078125, 0.283355712890625, 0.3003997802734375, 0.31744384765625, 0.3344879150390625, 0.351531982421875, 0.3685760498046875, 0.3856201171875, 0.4026641845703125, 0.419708251953125, 0.4367523193359375, 0.45379638671875, 0.4708404541015625, 0.487884521484375, 0.5049285888671875, 0.52197265625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 5.0, 7.0, 11.0, 19.0, 36.0, 61.0, 98.0, 202.0, 545.0, 1821.0, 10438.0, 397189.0, 3740012.0, 38715.0, 3584.0, 891.0, 336.0, 128.0, 80.0, 38.0, 20.0, 18.0, 7.0, 8.0, 6.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.158203125, -1.1171875, -1.076171875, -1.03515625, -0.994140625, -0.953125, -0.912109375, -0.87109375, -0.830078125, -0.7890625, -0.748046875, -0.70703125, -0.666015625, -0.625, -0.583984375, -0.54296875, -0.501953125, -0.4609375, -0.419921875, -0.37890625, -0.337890625, -0.296875, -0.255859375, -0.21484375, -0.173828125, -0.1328125, -0.091796875, -0.05078125, -0.009765625, 0.03125, 0.072265625, 0.11328125, 0.154296875, 0.1953125, 0.236328125, 0.27734375, 0.318359375, 0.359375, 0.400390625, 0.44140625, 0.482421875, 0.5234375, 0.564453125, 0.60546875, 0.646484375, 0.6875, 0.728515625, 0.76953125, 0.810546875, 0.8515625, 0.892578125, 0.93359375, 0.974609375, 1.015625, 1.056640625, 1.09765625, 1.138671875, 1.1796875, 1.220703125, 1.26171875, 1.302734375, 1.34375, 1.384765625, 1.42578125, 1.466796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 7.0, 9.0, 19.0, 35.0, 56.0, 69.0, 130.0, 185.0, 307.0, 524.0, 686.0, 696.0, 491.0, 300.0, 209.0, 96.0, 68.0, 56.0, 34.0, 23.0, 17.0, 17.0, 4.0, 11.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2154541015625, -0.20891380310058594, -0.20237350463867188, -0.1958332061767578, -0.18929290771484375, -0.1827526092529297, -0.17621231079101562, -0.16967201232910156, -0.1631317138671875, -0.15659141540527344, -0.15005111694335938, -0.1435108184814453, -0.13697052001953125, -0.1304302215576172, -0.12388992309570312, -0.11734962463378906, -0.110809326171875, -0.10426902770996094, -0.09772872924804688, -0.09118843078613281, -0.08464813232421875, -0.07810783386230469, -0.07156753540039062, -0.06502723693847656, -0.0584869384765625, -0.05194664001464844, -0.045406341552734375, -0.03886604309082031, -0.03232574462890625, -0.025785446166992188, -0.019245147705078125, -0.012704849243164062, -0.00616455078125, 0.0003757476806640625, 0.006916046142578125, 0.013456344604492188, 0.01999664306640625, 0.026536941528320312, 0.033077239990234375, 0.03961753845214844, 0.0461578369140625, 0.05269813537597656, 0.059238433837890625, 0.06577873229980469, 0.07231903076171875, 0.07885932922363281, 0.08539962768554688, 0.09193992614746094, 0.098480224609375, 0.10502052307128906, 0.11156082153320312, 0.11810111999511719, 0.12464141845703125, 0.1311817169189453, 0.13772201538085938, 0.14426231384277344, 0.1508026123046875, 0.15734291076660156, 0.16388320922851562, 0.1704235076904297, 0.17696380615234375, 0.1835041046142578, 0.19004440307617188, 0.19658470153808594, 0.203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 17.0, 54.0, 100.0, 158.0, 239.0, 200.0, 118.0, 68.0, 24.0, 12.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4945473670959473, -2.4410018920898438, -2.3874564170837402, -2.3339109420776367, -2.280365467071533, -2.2268199920654297, -2.173274517059326, -2.1197290420532227, -2.06618332862854, -2.0126378536224365, -1.959092378616333, -1.9055469036102295, -1.8520013093948364, -1.798455834388733, -1.7449103593826294, -1.6913648843765259, -1.637819528579712, -1.5842740535736084, -1.5307285785675049, -1.4771831035614014, -1.4236375093460083, -1.3700920343399048, -1.3165465593338013, -1.2630010843276978, -1.2094554901123047, -1.1559100151062012, -1.1023645401000977, -1.0488190650939941, -0.9952735304832458, -0.9417279958724976, -0.888182520866394, -0.8346370458602905, -0.7810916304588318, -0.7275461554527283, -0.67400062084198, -0.6204551458358765, -0.566909670829773, -0.5133641958236694, -0.45981866121292114, -0.4062731862068176, -0.3527276813983917, -0.2991821765899658, -0.2456367015838623, -0.1920911967754364, -0.1385457068681717, -0.08500021696090698, -0.03145471215248108, 0.022090762853622437, 0.07563626766204834, 0.12918175756931305, 0.18272724747657776, 0.23627275228500366, 0.2898182272911072, 0.3433637320995331, 0.396909236907959, 0.4504547119140625, 0.504000186920166, 0.5575456619262695, 0.6110911965370178, 0.6646366715431213, 0.7181821465492249, 0.7717276811599731, 0.8252731561660767, 0.8788186311721802, 0.9323641657829285]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 10.0, 13.0, 13.0, 20.0, 25.0, 37.0, 48.0, 51.0, 56.0, 64.0, 73.0, 69.0, 64.0, 53.0, 68.0, 51.0, 54.0, 56.0, 31.0, 31.0, 29.0, 23.0, 13.0, 15.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4739203155040741, -0.45512574911117554, -0.4363311529159546, -0.41753658652305603, -0.39874202013015747, -0.3799474537372589, -0.36115288734436035, -0.3423582911491394, -0.32356372475624084, -0.3047691583633423, -0.28597456216812134, -0.2671799957752228, -0.24838542938232422, -0.22959086298942566, -0.2107962816953659, -0.19200170040130615, -0.1732071340084076, -0.15441256761550903, -0.13561798632144928, -0.11682341247797012, -0.09802883863449097, -0.07923426479101181, -0.060439690947532654, -0.0416451096534729, -0.02285054326057434, -0.004055969417095184, 0.014738604426383972, 0.03353317826986313, 0.052327752113342285, 0.07112232595682144, 0.0899168998003006, 0.10871148109436035, 0.1275060772895813, 0.14630064368247986, 0.1650952249765396, 0.18388980627059937, 0.20268437266349792, 0.22147893905639648, 0.24027352035045624, 0.259068101644516, 0.27786266803741455, 0.2966572344303131, 0.31545180082321167, 0.3342463970184326, 0.3530409634113312, 0.37183552980422974, 0.3906301259994507, 0.40942469239234924, 0.4282192587852478, 0.44701382517814636, 0.4658083915710449, 0.48460298776626587, 0.5033975839614868, 0.522192120552063, 0.5409867167472839, 0.5597813129425049, 0.578575849533081, 0.597370445728302, 0.6161649823188782, 0.6349595785140991, 0.6537541151046753, 0.6725487112998962, 0.6913433074951172, 0.7101378440856934, 0.7289324402809143]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 15.0, 20.0, 83.0, 246.0, 1053.0, 5538.0, 96439.0, 913103.0, 27928.0, 3246.0, 667.0, 129.0, 41.0, 11.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5201263427734375, -0.506561279296875, -0.4929962158203125, -0.47943115234375, -0.4658660888671875, -0.452301025390625, -0.4387359619140625, -0.4251708984375, -0.4116058349609375, -0.398040771484375, -0.3844757080078125, -0.37091064453125, -0.3573455810546875, -0.343780517578125, -0.3302154541015625, -0.316650390625, -0.3030853271484375, -0.289520263671875, -0.2759552001953125, -0.26239013671875, -0.2488250732421875, -0.235260009765625, -0.2216949462890625, -0.2081298828125, -0.1945648193359375, -0.180999755859375, -0.1674346923828125, -0.15386962890625, -0.1403045654296875, -0.126739501953125, -0.1131744384765625, -0.099609375, -0.0860443115234375, -0.072479248046875, -0.0589141845703125, -0.04534912109375, -0.0317840576171875, -0.018218994140625, -0.0046539306640625, 0.0089111328125, 0.0224761962890625, 0.036041259765625, 0.0496063232421875, 0.06317138671875, 0.0767364501953125, 0.090301513671875, 0.1038665771484375, 0.117431640625, 0.1309967041015625, 0.144561767578125, 0.1581268310546875, 0.17169189453125, 0.1852569580078125, 0.198822021484375, 0.2123870849609375, 0.2259521484375, 0.2395172119140625, 0.253082275390625, 0.2666473388671875, 0.28021240234375, 0.2937774658203125, 0.307342529296875, 0.3209075927734375, 0.33447265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 22.0, 24.0, 37.0, 35.0, 46.0, 67.0, 82.0, 85.0, 87.0, 62.0, 56.0, 73.0, 68.0, 54.0, 41.0, 34.0, 31.0, 17.0, 17.0, 9.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.378570556640625, -0.36456298828125, -0.350555419921875, -0.3365478515625, -0.322540283203125, -0.30853271484375, -0.294525146484375, -0.280517578125, -0.266510009765625, -0.25250244140625, -0.238494873046875, -0.2244873046875, -0.210479736328125, -0.19647216796875, -0.182464599609375, -0.16845703125, -0.154449462890625, -0.14044189453125, -0.126434326171875, -0.1124267578125, -0.098419189453125, -0.08441162109375, -0.070404052734375, -0.056396484375, -0.042388916015625, -0.02838134765625, -0.014373779296875, -0.0003662109375, 0.013641357421875, 0.02764892578125, 0.041656494140625, 0.0556640625, 0.069671630859375, 0.08367919921875, 0.097686767578125, 0.1116943359375, 0.125701904296875, 0.13970947265625, 0.153717041015625, 0.167724609375, 0.181732177734375, 0.19573974609375, 0.209747314453125, 0.2237548828125, 0.237762451171875, 0.25177001953125, 0.265777587890625, 0.27978515625, 0.293792724609375, 0.30780029296875, 0.321807861328125, 0.3358154296875, 0.349822998046875, 0.36383056640625, 0.377838134765625, 0.391845703125, 0.405853271484375, 0.41986083984375, 0.433868408203125, 0.4478759765625, 0.461883544921875, 0.47589111328125, 0.489898681640625, 0.50390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 5.0, 8.0, 17.0, 24.0, 38.0, 32.0, 68.0, 84.0, 150.0, 234.0, 344.0, 604.0, 935.0, 1664.0, 2983.0, 5873.0, 14535.0, 54841.0, 258164.0, 481972.0, 168240.0, 35921.0, 11022.0, 4687.0, 2510.0, 1400.0, 807.0, 512.0, 307.0, 197.0, 109.0, 70.0, 52.0, 37.0, 23.0, 25.0, 8.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09942626953125, -0.096038818359375, -0.0926513671875, -0.089263916015625, -0.08587646484375, -0.082489013671875, -0.0791015625, -0.075714111328125, -0.07232666015625, -0.068939208984375, -0.0655517578125, -0.062164306640625, -0.05877685546875, -0.055389404296875, -0.052001953125, -0.048614501953125, -0.04522705078125, -0.041839599609375, -0.0384521484375, -0.035064697265625, -0.03167724609375, -0.028289794921875, -0.02490234375, -0.021514892578125, -0.01812744140625, -0.014739990234375, -0.0113525390625, -0.007965087890625, -0.00457763671875, -0.001190185546875, 0.002197265625, 0.005584716796875, 0.00897216796875, 0.012359619140625, 0.0157470703125, 0.019134521484375, 0.02252197265625, 0.025909423828125, 0.029296875, 0.032684326171875, 0.03607177734375, 0.039459228515625, 0.0428466796875, 0.046234130859375, 0.04962158203125, 0.053009033203125, 0.056396484375, 0.059783935546875, 0.06317138671875, 0.066558837890625, 0.0699462890625, 0.073333740234375, 0.07672119140625, 0.080108642578125, 0.08349609375, 0.086883544921875, 0.09027099609375, 0.093658447265625, 0.0970458984375, 0.100433349609375, 0.10382080078125, 0.107208251953125, 0.110595703125, 0.113983154296875, 0.11737060546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 4.0, 10.0, 11.0, 20.0, 19.0, 15.0, 16.0, 20.0, 29.0, 29.0, 25.0, 37.0, 30.0, 43.0, 38.0, 45.0, 50.0, 47.0, 41.0, 53.0, 54.0, 32.0, 50.0, 31.0, 32.0, 35.0, 26.0, 24.0, 10.0, 14.0, 15.0, 18.0, 14.0, 12.0, 5.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.49910736083984375, -0.4825897216796875, -0.46607208251953125, -0.449554443359375, -0.43303680419921875, -0.4165191650390625, -0.40000152587890625, -0.38348388671875, -0.36696624755859375, -0.3504486083984375, -0.33393096923828125, -0.317413330078125, -0.30089569091796875, -0.2843780517578125, -0.26786041259765625, -0.2513427734375, -0.23482513427734375, -0.2183074951171875, -0.20178985595703125, -0.185272216796875, -0.16875457763671875, -0.1522369384765625, -0.13571929931640625, -0.11920166015625, -0.10268402099609375, -0.0861663818359375, -0.06964874267578125, -0.053131103515625, -0.03661346435546875, -0.0200958251953125, -0.00357818603515625, 0.012939453125, 0.02945709228515625, 0.0459747314453125, 0.06249237060546875, 0.079010009765625, 0.09552764892578125, 0.1120452880859375, 0.12856292724609375, 0.14508056640625, 0.16159820556640625, 0.1781158447265625, 0.19463348388671875, 0.211151123046875, 0.22766876220703125, 0.2441864013671875, 0.26070404052734375, 0.2772216796875, 0.29373931884765625, 0.3102569580078125, 0.32677459716796875, 0.343292236328125, 0.35980987548828125, 0.3763275146484375, 0.39284515380859375, 0.40936279296875, 0.42588043212890625, 0.4423980712890625, 0.45891571044921875, 0.475433349609375, 0.49195098876953125, 0.5084686279296875, 0.5249862670898438, 0.54150390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 15.0, 13.0, 15.0, 21.0, 37.0, 66.0, 92.0, 179.0, 271.0, 464.0, 853.0, 1620.0, 3412.0, 7745.0, 21429.0, 69332.0, 238705.0, 416689.0, 199057.0, 57618.0, 18164.0, 6615.0, 2797.0, 1446.0, 769.0, 427.0, 229.0, 157.0, 92.0, 63.0, 59.0, 24.0, 17.0, 15.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0312347412109375, -0.030327320098876953, -0.029419898986816406, -0.02851247787475586, -0.027605056762695312, -0.026697635650634766, -0.02579021453857422, -0.024882793426513672, -0.023975372314453125, -0.023067951202392578, -0.02216053009033203, -0.021253108978271484, -0.020345687866210938, -0.01943826675415039, -0.018530845642089844, -0.017623424530029297, -0.01671600341796875, -0.015808582305908203, -0.014901161193847656, -0.01399374008178711, -0.013086318969726562, -0.012178897857666016, -0.011271476745605469, -0.010364055633544922, -0.009456634521484375, -0.008549213409423828, -0.007641792297363281, -0.006734371185302734, -0.0058269500732421875, -0.004919528961181641, -0.004012107849121094, -0.003104686737060547, -0.002197265625, -0.0012898445129394531, -0.00038242340087890625, 0.0005249977111816406, 0.0014324188232421875, 0.0023398399353027344, 0.0032472610473632812, 0.004154682159423828, 0.005062103271484375, 0.005969524383544922, 0.006876945495605469, 0.007784366607666016, 0.008691787719726562, 0.00959920883178711, 0.010506629943847656, 0.011414051055908203, 0.01232147216796875, 0.013228893280029297, 0.014136314392089844, 0.01504373550415039, 0.015951156616210938, 0.016858577728271484, 0.01776599884033203, 0.018673419952392578, 0.019580841064453125, 0.020488262176513672, 0.02139568328857422, 0.022303104400634766, 0.023210525512695312, 0.02411794662475586, 0.025025367736816406, 0.025932788848876953, 0.0268402099609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 12.0, 10.0, 11.0, 15.0, 20.0, 21.0, 27.0, 35.0, 50.0, 64.0, 88.0, 73.0, 121.0, 104.0, 65.0, 74.0, 57.0, 41.0, 30.0, 21.0, 10.0, 15.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.621246337890625e-05, -1.569557934999466e-05, -1.5178695321083069e-05, -1.4661811292171478e-05, -1.4144927263259888e-05, -1.3628043234348297e-05, -1.3111159205436707e-05, -1.2594275176525116e-05, -1.2077391147613525e-05, -1.1560507118701935e-05, -1.1043623089790344e-05, -1.0526739060878754e-05, -1.0009855031967163e-05, -9.492971003055573e-06, -8.976086974143982e-06, -8.459202945232391e-06, -7.9423189163208e-06, -7.42543488740921e-06, -6.90855085849762e-06, -6.391666829586029e-06, -5.8747828006744385e-06, -5.357898771762848e-06, -4.841014742851257e-06, -4.324130713939667e-06, -3.807246685028076e-06, -3.2903626561164856e-06, -2.773478627204895e-06, -2.2565945982933044e-06, -1.7397105693817139e-06, -1.2228265404701233e-06, -7.059425115585327e-07, -1.8905848264694214e-07, 3.2782554626464844e-07, 8.44709575176239e-07, 1.3615936040878296e-06, 1.8784776329994202e-06, 2.3953616619110107e-06, 2.9122456908226013e-06, 3.429129719734192e-06, 3.9460137486457825e-06, 4.462897777557373e-06, 4.979781806468964e-06, 5.496665835380554e-06, 6.013549864292145e-06, 6.530433893203735e-06, 7.047317922115326e-06, 7.5642019510269165e-06, 8.081085979938507e-06, 8.597970008850098e-06, 9.114854037761688e-06, 9.631738066673279e-06, 1.014862209558487e-05, 1.066550612449646e-05, 1.118239015340805e-05, 1.1699274182319641e-05, 1.2216158211231232e-05, 1.2733042240142822e-05, 1.3249926269054413e-05, 1.3766810297966003e-05, 1.4283694326877594e-05, 1.4800578355789185e-05, 1.5317462384700775e-05, 1.5834346413612366e-05, 1.6351230442523956e-05, 1.6868114471435547e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 5.0, 10.0, 18.0, 15.0, 24.0, 35.0, 48.0, 67.0, 90.0, 139.0, 267.0, 437.0, 938.0, 2127.0, 5692.0, 17192.0, 60601.0, 219329.0, 417200.0, 230748.0, 64740.0, 18171.0, 6132.0, 2287.0, 1029.0, 471.0, 286.0, 151.0, 89.0, 83.0, 46.0, 19.0, 14.0, 11.0, 12.0, 9.0, 2.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0308074951171875, -0.029830217361450195, -0.02885293960571289, -0.027875661849975586, -0.02689838409423828, -0.025921106338500977, -0.024943828582763672, -0.023966550827026367, -0.022989273071289062, -0.022011995315551758, -0.021034717559814453, -0.02005743980407715, -0.019080162048339844, -0.01810288429260254, -0.017125606536865234, -0.01614832878112793, -0.015171051025390625, -0.01419377326965332, -0.013216495513916016, -0.012239217758178711, -0.011261940002441406, -0.010284662246704102, -0.009307384490966797, -0.008330106735229492, -0.0073528289794921875, -0.006375551223754883, -0.005398273468017578, -0.0044209957122802734, -0.0034437179565429688, -0.002466440200805664, -0.0014891624450683594, -0.0005118846893310547, 0.00046539306640625, 0.0014426708221435547, 0.0024199485778808594, 0.003397226333618164, 0.004374504089355469, 0.0053517818450927734, 0.006329059600830078, 0.007306337356567383, 0.008283615112304688, 0.009260892868041992, 0.010238170623779297, 0.011215448379516602, 0.012192726135253906, 0.013170003890991211, 0.014147281646728516, 0.01512455940246582, 0.016101837158203125, 0.01707911491394043, 0.018056392669677734, 0.01903367042541504, 0.020010948181152344, 0.02098822593688965, 0.021965503692626953, 0.022942781448364258, 0.023920059204101562, 0.024897336959838867, 0.025874614715576172, 0.026851892471313477, 0.02782917022705078, 0.028806447982788086, 0.02978372573852539, 0.030761003494262695, 0.03173828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 9.0, 7.0, 14.0, 20.0, 9.0, 21.0, 29.0, 34.0, 37.0, 37.0, 58.0, 50.0, 57.0, 46.0, 55.0, 50.0, 59.0, 33.0, 51.0, 45.0, 41.0, 38.0, 32.0, 20.0, 25.0, 24.0, 22.0, 12.0, 6.0, 9.0, 4.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.007419586181640625, -0.007188856601715088, -0.006958127021789551, -0.006727397441864014, -0.0064966678619384766, -0.0062659382820129395, -0.006035208702087402, -0.005804479122161865, -0.005573749542236328, -0.005343019962310791, -0.005112290382385254, -0.004881560802459717, -0.00465083122253418, -0.004420101642608643, -0.0041893720626831055, -0.003958642482757568, -0.0037279129028320312, -0.003497183322906494, -0.003266453742980957, -0.00303572416305542, -0.002804994583129883, -0.0025742650032043457, -0.0023435354232788086, -0.0021128058433532715, -0.0018820762634277344, -0.0016513466835021973, -0.0014206171035766602, -0.001189887523651123, -0.0009591579437255859, -0.0007284283638000488, -0.0004976987838745117, -0.0002669692039489746, -3.62396240234375e-05, 0.0001944899559020996, 0.0004252195358276367, 0.0006559491157531738, 0.0008866786956787109, 0.001117408275604248, 0.0013481378555297852, 0.0015788674354553223, 0.0018095970153808594, 0.0020403265953063965, 0.0022710561752319336, 0.0025017857551574707, 0.002732515335083008, 0.002963244915008545, 0.003193974494934082, 0.003424704074859619, 0.0036554336547851562, 0.0038861632347106934, 0.0041168928146362305, 0.004347622394561768, 0.004578351974487305, 0.004809081554412842, 0.005039811134338379, 0.005270540714263916, 0.005501270294189453, 0.00573199987411499, 0.005962729454040527, 0.0061934590339660645, 0.0064241886138916016, 0.006654918193817139, 0.006885647773742676, 0.007116377353668213, 0.00734710693359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 11.0, 80.0, 377.0, 440.0, 82.0, 19.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4104955196380615, -3.3347394466400146, -3.258983612060547, -3.1832275390625, -3.107471466064453, -3.0317153930664062, -2.9559593200683594, -2.8802034854888916, -2.8044474124908447, -2.728691339492798, -2.65293550491333, -2.577179431915283, -2.5014233589172363, -2.4256672859191895, -2.3499112129211426, -2.274155378341675, -2.198399305343628, -2.122643232345581, -2.0468873977661133, -1.9711313247680664, -1.8953752517700195, -1.8196191787719727, -1.7438632249832153, -1.668107271194458, -1.5923511981964111, -1.5165951251983643, -1.440839171409607, -1.3650832176208496, -1.2893271446228027, -1.2135710716247559, -1.1378151178359985, -1.0620591640472412, -0.9863032102584839, -0.9105471968650818, -0.8347911834716797, -0.7590351700782776, -0.6832791566848755, -0.6075231432914734, -0.5317671298980713, -0.4560111165046692, -0.3802551031112671, -0.304499089717865, -0.2287430763244629, -0.1529870629310608, -0.07723104953765869, -0.0014750361442565918, 0.07428097724914551, 0.1500369906425476, 0.2257930040359497, 0.3015490174293518, 0.3773050308227539, 0.453061044216156, 0.5288170576095581, 0.6045730710029602, 0.6803290843963623, 0.7560850977897644, 0.8318411111831665, 0.9075971245765686, 0.9833531379699707, 1.0591092109680176, 1.134865164756775, 1.2106211185455322, 1.286377191543579, 1.362133264541626, 1.4378892183303833]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 7.0, 18.0, 24.0, 34.0, 55.0, 56.0, 77.0, 98.0, 83.0, 98.0, 77.0, 86.0, 64.0, 65.0, 48.0, 31.0, 29.0, 14.0, 8.0, 5.0, 9.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34692132472991943, -0.33067426085472107, -0.3144271969795227, -0.29818010330200195, -0.2819330394268036, -0.2656859755516052, -0.24943889677524567, -0.2331918179988861, -0.21694475412368774, -0.20069769024848938, -0.18445061147212982, -0.16820353269577026, -0.1519564688205719, -0.13570940494537354, -0.11946232616901398, -0.10321525484323502, -0.08696818351745605, -0.0707211121916771, -0.05447404086589813, -0.03822696954011917, -0.02197989821434021, -0.005732826888561249, 0.010514244437217712, 0.026761315762996674, 0.043008387088775635, 0.059255458414554596, 0.07550252974033356, 0.09174960106611252, 0.10799667239189148, 0.12424374371767044, 0.1404908150434494, 0.15673789381980896, 0.1729850172996521, 0.18923208117485046, 0.20547915995121002, 0.22172623872756958, 0.23797330260276794, 0.2542203664779663, 0.27046746015548706, 0.2867145240306854, 0.3029615879058838, 0.31920865178108215, 0.3354557156562805, 0.35170280933380127, 0.36794987320899963, 0.384196937084198, 0.40044403076171875, 0.4166910946369171, 0.4329381585121155, 0.44918522238731384, 0.4654322862625122, 0.48167937994003296, 0.4979264438152313, 0.5141735076904297, 0.5304206013679504, 0.5466676354408264, 0.5629147291183472, 0.5791618227958679, 0.5954088568687439, 0.6116559505462646, 0.6279029846191406, 0.6441500782966614, 0.6603971719741821, 0.6766442060470581, 0.6928912997245789]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 4.0, 7.0, 11.0, 22.0, 14.0, 33.0, 48.0, 62.0, 99.0, 178.0, 291.0, 562.0, 1106.0, 2207.0, 5366.0, 15084.0, 48032.0, 325398.0, 553947.0, 64402.0, 19312.0, 6896.0, 2703.0, 1247.0, 661.0, 304.0, 174.0, 132.0, 92.0, 48.0, 39.0, 19.0, 12.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.35003662109375, -0.3380126953125, -0.32598876953125, -0.31396484375, -0.30194091796875, -0.2899169921875, -0.27789306640625, -0.265869140625, -0.25384521484375, -0.2418212890625, -0.22979736328125, -0.2177734375, -0.20574951171875, -0.1937255859375, -0.18170166015625, -0.169677734375, -0.15765380859375, -0.1456298828125, -0.13360595703125, -0.12158203125, -0.10955810546875, -0.0975341796875, -0.08551025390625, -0.073486328125, -0.06146240234375, -0.0494384765625, -0.03741455078125, -0.025390625, -0.01336669921875, -0.0013427734375, 0.01068115234375, 0.022705078125, 0.03472900390625, 0.0467529296875, 0.05877685546875, 0.07080078125, 0.08282470703125, 0.0948486328125, 0.10687255859375, 0.118896484375, 0.13092041015625, 0.1429443359375, 0.15496826171875, 0.1669921875, 0.17901611328125, 0.1910400390625, 0.20306396484375, 0.215087890625, 0.22711181640625, 0.2391357421875, 0.25115966796875, 0.26318359375, 0.27520751953125, 0.2872314453125, 0.29925537109375, 0.311279296875, 0.32330322265625, 0.3353271484375, 0.34735107421875, 0.359375, 0.37139892578125, 0.3834228515625, 0.39544677734375, 0.407470703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 10.0, 21.0, 36.0, 32.0, 56.0, 63.0, 74.0, 90.0, 94.0, 81.0, 76.0, 72.0, 67.0, 54.0, 43.0, 31.0, 38.0, 14.0, 11.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7298431396484375, -0.700897216796875, -0.6719512939453125, -0.64300537109375, -0.6140594482421875, -0.585113525390625, -0.5561676025390625, -0.5272216796875, -0.4982757568359375, -0.469329833984375, -0.4403839111328125, -0.41143798828125, -0.3824920654296875, -0.353546142578125, -0.3246002197265625, -0.295654296875, -0.2667083740234375, -0.237762451171875, -0.2088165283203125, -0.17987060546875, -0.1509246826171875, -0.121978759765625, -0.0930328369140625, -0.0640869140625, -0.0351409912109375, -0.006195068359375, 0.0227508544921875, 0.05169677734375, 0.0806427001953125, 0.109588623046875, 0.1385345458984375, 0.16748046875, 0.1964263916015625, 0.225372314453125, 0.2543182373046875, 0.28326416015625, 0.3122100830078125, 0.341156005859375, 0.3701019287109375, 0.3990478515625, 0.4279937744140625, 0.456939697265625, 0.4858856201171875, 0.51483154296875, 0.5437774658203125, 0.572723388671875, 0.6016693115234375, 0.630615234375, 0.6595611572265625, 0.688507080078125, 0.7174530029296875, 0.74639892578125, 0.7753448486328125, 0.804290771484375, 0.8332366943359375, 0.8621826171875, 0.8911285400390625, 0.920074462890625, 0.9490203857421875, 0.97796630859375, 1.0069122314453125, 1.035858154296875, 1.0648040771484375, 1.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 10.0, 12.0, 16.0, 8.0, 24.0, 25.0, 33.0, 39.0, 49.0, 76.0, 86.0, 93.0, 144.0, 190.0, 264.0, 401.0, 831.0, 2680.0, 18356.0, 399937.0, 597362.0, 22287.0, 3113.0, 880.0, 447.0, 300.0, 193.0, 151.0, 112.0, 95.0, 68.0, 53.0, 42.0, 34.0, 37.0, 18.0, 8.0, 14.0, 18.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6474609375, -0.6251678466796875, -0.602874755859375, -0.5805816650390625, -0.55828857421875, -0.5359954833984375, -0.513702392578125, -0.4914093017578125, -0.4691162109375, -0.4468231201171875, -0.424530029296875, -0.4022369384765625, -0.37994384765625, -0.3576507568359375, -0.335357666015625, -0.3130645751953125, -0.290771484375, -0.2684783935546875, -0.246185302734375, -0.2238922119140625, -0.20159912109375, -0.1793060302734375, -0.157012939453125, -0.1347198486328125, -0.1124267578125, -0.0901336669921875, -0.067840576171875, -0.0455474853515625, -0.02325439453125, -0.0009613037109375, 0.021331787109375, 0.0436248779296875, 0.06591796875, 0.0882110595703125, 0.110504150390625, 0.1327972412109375, 0.15509033203125, 0.1773834228515625, 0.199676513671875, 0.2219696044921875, 0.2442626953125, 0.2665557861328125, 0.288848876953125, 0.3111419677734375, 0.33343505859375, 0.3557281494140625, 0.378021240234375, 0.4003143310546875, 0.422607421875, 0.4449005126953125, 0.467193603515625, 0.4894866943359375, 0.51177978515625, 0.5340728759765625, 0.556365966796875, 0.5786590576171875, 0.6009521484375, 0.6232452392578125, 0.645538330078125, 0.6678314208984375, 0.69012451171875, 0.7124176025390625, 0.734710693359375, 0.7570037841796875, 0.779296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 5.0, 5.0, 10.0, 7.0, 17.0, 15.0, 14.0, 27.0, 22.0, 34.0, 49.0, 48.0, 47.0, 58.0, 63.0, 62.0, 55.0, 61.0, 64.0, 35.0, 34.0, 52.0, 25.0, 27.0, 27.0, 20.0, 15.0, 20.0, 13.0, 6.0, 11.0, 13.0, 8.0, 10.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.79833984375, -0.7741470336914062, -0.7499542236328125, -0.7257614135742188, -0.701568603515625, -0.6773757934570312, -0.6531829833984375, -0.6289901733398438, -0.60479736328125, -0.5806045532226562, -0.5564117431640625, -0.5322189331054688, -0.508026123046875, -0.48383331298828125, -0.4596405029296875, -0.43544769287109375, -0.4112548828125, -0.38706207275390625, -0.3628692626953125, -0.33867645263671875, -0.314483642578125, -0.29029083251953125, -0.2660980224609375, -0.24190521240234375, -0.21771240234375, -0.19351959228515625, -0.1693267822265625, -0.14513397216796875, -0.120941162109375, -0.09674835205078125, -0.0725555419921875, -0.04836273193359375, -0.024169921875, 2.288818359375e-05, 0.0242156982421875, 0.04840850830078125, 0.072601318359375, 0.09679412841796875, 0.1209869384765625, 0.14517974853515625, 0.16937255859375, 0.19356536865234375, 0.2177581787109375, 0.24195098876953125, 0.266143798828125, 0.29033660888671875, 0.3145294189453125, 0.33872222900390625, 0.3629150390625, 0.38710784912109375, 0.4113006591796875, 0.43549346923828125, 0.459686279296875, 0.48387908935546875, 0.5080718994140625, 0.5322647094726562, 0.55645751953125, 0.5806503295898438, 0.6048431396484375, 0.6290359497070312, 0.653228759765625, 0.6774215698242188, 0.7016143798828125, 0.7258071899414062, 0.75]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 10.0, 27.0, 24.0, 52.0, 82.0, 112.0, 169.0, 294.0, 490.0, 1359.0, 7062.0, 808364.0, 223268.0, 4811.0, 1141.0, 492.0, 286.0, 146.0, 122.0, 76.0, 45.0, 44.0, 17.0, 19.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.5712890625, -0.5576591491699219, -0.5440292358398438, -0.5303993225097656, -0.5167694091796875, -0.5031394958496094, -0.48950958251953125, -0.4758796691894531, -0.462249755859375, -0.4486198425292969, -0.43498992919921875, -0.4213600158691406, -0.4077301025390625, -0.3941001892089844, -0.38047027587890625, -0.3668403625488281, -0.35321044921875, -0.3395805358886719, -0.32595062255859375, -0.3123207092285156, -0.2986907958984375, -0.2850608825683594, -0.27143096923828125, -0.2578010559082031, -0.244171142578125, -0.23054122924804688, -0.21691131591796875, -0.20328140258789062, -0.1896514892578125, -0.17602157592773438, -0.16239166259765625, -0.14876174926757812, -0.1351318359375, -0.12150192260742188, -0.10787200927734375, -0.09424209594726562, -0.0806121826171875, -0.06698226928710938, -0.05335235595703125, -0.039722442626953125, -0.026092529296875, -0.012462615966796875, 0.00116729736328125, 0.014797210693359375, 0.0284271240234375, 0.042057037353515625, 0.05568695068359375, 0.06931686401367188, 0.08294677734375, 0.09657669067382812, 0.11020660400390625, 0.12383651733398438, 0.1374664306640625, 0.15109634399414062, 0.16472625732421875, 0.17835617065429688, 0.191986083984375, 0.20561599731445312, 0.21924591064453125, 0.23287582397460938, 0.2465057373046875, 0.2601356506347656, 0.27376556396484375, 0.2873954772949219, 0.301025390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 18.0, 50.0, 153.0, 559.0, 129.0, 46.0, 17.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6193599700927734e-05, -4.337821155786514e-05, -4.056282341480255e-05, -3.774743527173996e-05, -3.493204712867737e-05, -3.2116658985614777e-05, -2.9301270842552185e-05, -2.6485882699489594e-05, -2.3670494556427002e-05, -2.085510641336441e-05, -1.803971827030182e-05, -1.5224330127239227e-05, -1.2408941984176636e-05, -9.593553841114044e-06, -6.778165698051453e-06, -3.962777554988861e-06, -1.1473894119262695e-06, 1.667998731136322e-06, 4.4833868741989136e-06, 7.298775017261505e-06, 1.0114163160324097e-05, 1.2929551303386688e-05, 1.574493944644928e-05, 1.856032758951187e-05, 2.1375715732574463e-05, 2.4191103875637054e-05, 2.7006492018699646e-05, 2.9821880161762238e-05, 3.263726830482483e-05, 3.545265644788742e-05, 3.826804459095001e-05, 4.1083432734012604e-05, 4.3898820877075195e-05, 4.671420902013779e-05, 4.952959716320038e-05, 5.234498530626297e-05, 5.516037344932556e-05, 5.797576159238815e-05, 6.0791149735450745e-05, 6.360653787851334e-05, 6.642192602157593e-05, 6.923731416463852e-05, 7.205270230770111e-05, 7.48680904507637e-05, 7.76834785938263e-05, 8.049886673688889e-05, 8.331425487995148e-05, 8.612964302301407e-05, 8.894503116607666e-05, 9.176041930913925e-05, 9.457580745220184e-05, 9.739119559526443e-05, 0.00010020658373832703, 0.00010302197188138962, 0.00010583736002445221, 0.0001086527481675148, 0.00011146813631057739, 0.00011428352445363998, 0.00011709891259670258, 0.00011991430073976517, 0.00012272968888282776, 0.00012554507702589035, 0.00012836046516895294, 0.00013117585331201553, 0.00013399124145507812]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 9.0, 5.0, 8.0, 21.0, 20.0, 29.0, 43.0, 48.0, 69.0, 106.0, 189.0, 231.0, 391.0, 745.0, 2246.0, 20026.0, 951936.0, 66099.0, 3951.0, 986.0, 497.0, 276.0, 216.0, 124.0, 83.0, 53.0, 41.0, 21.0, 21.0, 14.0, 14.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3447265625, -0.33074951171875, -0.3167724609375, -0.30279541015625, -0.288818359375, -0.27484130859375, -0.2608642578125, -0.24688720703125, -0.23291015625, -0.21893310546875, -0.2049560546875, -0.19097900390625, -0.177001953125, -0.16302490234375, -0.1490478515625, -0.13507080078125, -0.12109375, -0.10711669921875, -0.0931396484375, -0.07916259765625, -0.065185546875, -0.05120849609375, -0.0372314453125, -0.02325439453125, -0.00927734375, 0.00469970703125, 0.0186767578125, 0.03265380859375, 0.046630859375, 0.06060791015625, 0.0745849609375, 0.08856201171875, 0.1025390625, 0.11651611328125, 0.1304931640625, 0.14447021484375, 0.158447265625, 0.17242431640625, 0.1864013671875, 0.20037841796875, 0.21435546875, 0.22833251953125, 0.2423095703125, 0.25628662109375, 0.270263671875, 0.28424072265625, 0.2982177734375, 0.31219482421875, 0.326171875, 0.34014892578125, 0.3541259765625, 0.36810302734375, 0.382080078125, 0.39605712890625, 0.4100341796875, 0.42401123046875, 0.43798828125, 0.45196533203125, 0.4659423828125, 0.47991943359375, 0.493896484375, 0.50787353515625, 0.5218505859375, 0.53582763671875, 0.5498046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 10.0, 10.0, 15.0, 40.0, 44.0, 89.0, 194.0, 282.0, 137.0, 58.0, 41.0, 29.0, 14.0, 7.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10825538635253906, -0.10469436645507812, -0.10113334655761719, -0.09757232666015625, -0.09401130676269531, -0.09045028686523438, -0.08688926696777344, -0.0833282470703125, -0.07976722717285156, -0.07620620727539062, -0.07264518737792969, -0.06908416748046875, -0.06552314758300781, -0.061962127685546875, -0.05840110778808594, -0.054840087890625, -0.05127906799316406, -0.047718048095703125, -0.04415702819824219, -0.04059600830078125, -0.03703498840332031, -0.033473968505859375, -0.029912948608398438, -0.0263519287109375, -0.022790908813476562, -0.019229888916015625, -0.015668869018554688, -0.01210784912109375, -0.008546829223632812, -0.004985809326171875, -0.0014247894287109375, 0.00213623046875, 0.0056972503662109375, 0.009258270263671875, 0.012819290161132812, 0.01638031005859375, 0.019941329956054688, 0.023502349853515625, 0.027063369750976562, 0.0306243896484375, 0.03418540954589844, 0.037746429443359375, 0.04130744934082031, 0.04486846923828125, 0.04842948913574219, 0.051990509033203125, 0.05555152893066406, 0.059112548828125, 0.06267356872558594, 0.06623458862304688, 0.06979560852050781, 0.07335662841796875, 0.07691764831542969, 0.08047866821289062, 0.08403968811035156, 0.0876007080078125, 0.09116172790527344, 0.09472274780273438, 0.09828376770019531, 0.10184478759765625, 0.10540580749511719, 0.10896682739257812, 0.11252784729003906, 0.1160888671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 23.0, 46.0, 114.0, 200.0, 239.0, 197.0, 99.0, 43.0, 24.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.612043857574463, -2.543992519378662, -2.4759409427642822, -2.4078896045684814, -2.3398382663726807, -2.271786689758301, -2.2037353515625, -2.135684013366699, -2.0676324367523193, -1.999580979347229, -1.9315296411514282, -1.863478183746338, -1.7954267263412476, -1.7273752689361572, -1.6593239307403564, -1.5912724733352661, -1.5232211351394653, -1.455169677734375, -1.3871183395385742, -1.3190668821334839, -1.2510154247283936, -1.1829640865325928, -1.1149126291275024, -1.046861171722412, -0.9788097739219666, -0.910758376121521, -0.8427069187164307, -0.7746555209159851, -0.7066041231155396, -0.6385526657104492, -0.5705012679100037, -0.5024498701095581, -0.4343982934951782, -0.3663468658924103, -0.29829543828964233, -0.23024404048919678, -0.16219261288642883, -0.09414118528366089, -0.026089787483215332, 0.04196164011955261, 0.11001306772232056, 0.1780644953250885, 0.24611590802669525, 0.314167320728302, 0.38221874833106995, 0.4502701759338379, 0.5183215737342834, 0.586372971534729, 0.6544244289398193, 0.7224758267402649, 0.7905272841453552, 0.8585786819458008, 0.9266301393508911, 0.9946815371513367, 1.0627329349517822, 1.1307843923568726, 1.198835849761963, 1.2668873071670532, 1.334938645362854, 1.4029901027679443, 1.4710415601730347, 1.539093017578125, 1.6071443557739258, 1.6751958131790161, 1.743247151374817]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 7.0, 7.0, 9.0, 10.0, 18.0, 26.0, 28.0, 23.0, 25.0, 37.0, 26.0, 45.0, 34.0, 41.0, 47.0, 37.0, 47.0, 42.0, 34.0, 44.0, 48.0, 41.0, 39.0, 46.0, 30.0, 27.0, 28.0, 23.0, 15.0, 22.0, 15.0, 13.0, 5.0, 12.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0844839811325073, -1.0528457164764404, -1.0212074518203735, -0.9895691275596619, -0.9579308032989502, -0.9262925386428833, -0.8946542739868164, -0.8630160093307495, -0.8313776850700378, -0.799739420413971, -0.7681010961532593, -0.7364628314971924, -0.7048245668411255, -0.6731862425804138, -0.6415479779243469, -0.6099096536636353, -0.5782713890075684, -0.5466331243515015, -0.5149948000907898, -0.4833565354347229, -0.4517182409763336, -0.42007994651794434, -0.38844168186187744, -0.35680338740348816, -0.3251650929450989, -0.2935267984867096, -0.2618885040283203, -0.23025023937225342, -0.19861194491386414, -0.16697365045547485, -0.13533537089824677, -0.10369709134101868, -0.0720587968826294, -0.04042050987482071, -0.008782222867012024, 0.02285606414079666, 0.05449435114860535, 0.08613264560699463, 0.11777092516422272, 0.1494092047214508, 0.1810474991798401, 0.21268579363822937, 0.24432407319545746, 0.27596235275268555, 0.30760064721107483, 0.3392389416694641, 0.370877206325531, 0.4025155007839203, 0.43415379524230957, 0.46579208970069885, 0.49743038415908813, 0.529068648815155, 0.5607069730758667, 0.5923452377319336, 0.6239835023880005, 0.6556217670440674, 0.687260091304779, 0.718898355960846, 0.7505366802215576, 0.7821749448776245, 0.8138132095336914, 0.8454515337944031, 0.87708979845047, 0.9087281227111816, 0.9403663873672485]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 9.0, 4.0, 5.0, 10.0, 15.0, 7.0, 10.0, 8.0, 20.0, 22.0, 25.0, 28.0, 39.0, 47.0, 59.0, 105.0, 199.0, 606.0, 2646.0, 63580.0, 4069588.0, 53486.0, 2598.0, 559.0, 191.0, 86.0, 61.0, 46.0, 32.0, 24.0, 23.0, 19.0, 12.0, 24.0, 18.0, 11.0, 12.0, 6.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.785186767578125, -1.72662353515625, -1.668060302734375, -1.6094970703125, -1.550933837890625, -1.49237060546875, -1.433807373046875, -1.375244140625, -1.316680908203125, -1.25811767578125, -1.199554443359375, -1.1409912109375, -1.082427978515625, -1.02386474609375, -0.965301513671875, -0.90673828125, -0.848175048828125, -0.78961181640625, -0.731048583984375, -0.6724853515625, -0.613922119140625, -0.55535888671875, -0.496795654296875, -0.438232421875, -0.379669189453125, -0.32110595703125, -0.262542724609375, -0.2039794921875, -0.145416259765625, -0.08685302734375, -0.028289794921875, 0.0302734375, 0.088836669921875, 0.14739990234375, 0.205963134765625, 0.2645263671875, 0.323089599609375, 0.38165283203125, 0.440216064453125, 0.498779296875, 0.557342529296875, 0.61590576171875, 0.674468994140625, 0.7330322265625, 0.791595458984375, 0.85015869140625, 0.908721923828125, 0.96728515625, 1.025848388671875, 1.08441162109375, 1.142974853515625, 1.2015380859375, 1.260101318359375, 1.31866455078125, 1.377227783203125, 1.435791015625, 1.494354248046875, 1.55291748046875, 1.611480712890625, 1.6700439453125, 1.728607177734375, 1.78717041015625, 1.845733642578125, 1.904296875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 8.0, 7.0, 12.0, 16.0, 15.0, 21.0, 27.0, 34.0, 32.0, 44.0, 54.0, 67.0, 56.0, 64.0, 59.0, 63.0, 70.0, 51.0, 59.0, 46.0, 26.0, 38.0, 27.0, 21.0, 16.0, 11.0, 16.0, 9.0, 8.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4167518615722656, -0.40357208251953125, -0.3903923034667969, -0.3772125244140625, -0.3640327453613281, -0.35085296630859375, -0.3376731872558594, -0.324493408203125, -0.3113136291503906, -0.29813385009765625, -0.2849540710449219, -0.2717742919921875, -0.2585945129394531, -0.24541473388671875, -0.23223495483398438, -0.21905517578125, -0.20587539672851562, -0.19269561767578125, -0.17951583862304688, -0.1663360595703125, -0.15315628051757812, -0.13997650146484375, -0.12679672241210938, -0.113616943359375, -0.10043716430664062, -0.08725738525390625, -0.07407760620117188, -0.0608978271484375, -0.047718048095703125, -0.03453826904296875, -0.021358489990234375, -0.0081787109375, 0.005001068115234375, 0.01818084716796875, 0.031360626220703125, 0.0445404052734375, 0.057720184326171875, 0.07089996337890625, 0.08407974243164062, 0.097259521484375, 0.11043930053710938, 0.12361907958984375, 0.13679885864257812, 0.1499786376953125, 0.16315841674804688, 0.17633819580078125, 0.18951797485351562, 0.20269775390625, 0.21587753295898438, 0.22905731201171875, 0.24223709106445312, 0.2554168701171875, 0.2685966491699219, 0.28177642822265625, 0.2949562072753906, 0.308135986328125, 0.3213157653808594, 0.33449554443359375, 0.3476753234863281, 0.3608551025390625, 0.3740348815917969, 0.38721466064453125, 0.4003944396972656, 0.41357421875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 13.0, 10.0, 24.0, 70.0, 131.0, 410.0, 2034.0, 50873.0, 4095458.0, 42518.0, 2070.0, 394.0, 141.0, 64.0, 30.0, 19.0, 12.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.0858612060546875, -1.030120849609375, -0.9743804931640625, -0.91864013671875, -0.8628997802734375, -0.807159423828125, -0.7514190673828125, -0.6956787109375, -0.6399383544921875, -0.584197998046875, -0.5284576416015625, -0.47271728515625, -0.4169769287109375, -0.361236572265625, -0.3054962158203125, -0.249755859375, -0.1940155029296875, -0.138275146484375, -0.0825347900390625, -0.02679443359375, 0.0289459228515625, 0.084686279296875, 0.1404266357421875, 0.1961669921875, 0.2519073486328125, 0.307647705078125, 0.3633880615234375, 0.41912841796875, 0.4748687744140625, 0.530609130859375, 0.5863494873046875, 0.64208984375, 0.6978302001953125, 0.753570556640625, 0.8093109130859375, 0.86505126953125, 0.9207916259765625, 0.976531982421875, 1.0322723388671875, 1.0880126953125, 1.1437530517578125, 1.199493408203125, 1.2552337646484375, 1.31097412109375, 1.3667144775390625, 1.422454833984375, 1.4781951904296875, 1.533935546875, 1.5896759033203125, 1.645416259765625, 1.7011566162109375, 1.75689697265625, 1.8126373291015625, 1.868377685546875, 1.9241180419921875, 1.9798583984375, 2.0355987548828125, 2.091339111328125, 2.1470794677734375, 2.20281982421875, 2.2585601806640625, 2.314300537109375, 2.3700408935546875, 2.42578125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 9.0, 8.0, 20.0, 29.0, 66.0, 154.0, 287.0, 630.0, 1154.0, 896.0, 439.0, 186.0, 102.0, 46.0, 19.0, 13.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.48681640625, -0.47702980041503906, -0.4672431945800781, -0.4574565887451172, -0.44766998291015625, -0.4378833770751953, -0.4280967712402344, -0.41831016540527344, -0.4085235595703125, -0.39873695373535156, -0.3889503479003906, -0.3791637420654297, -0.36937713623046875, -0.3595905303955078, -0.3498039245605469, -0.34001731872558594, -0.330230712890625, -0.32044410705566406, -0.3106575012207031, -0.3008708953857422, -0.29108428955078125, -0.2812976837158203, -0.2715110778808594, -0.26172447204589844, -0.2519378662109375, -0.24215126037597656, -0.23236465454101562, -0.2225780487060547, -0.21279144287109375, -0.2030048370361328, -0.19321823120117188, -0.18343162536621094, -0.17364501953125, -0.16385841369628906, -0.15407180786132812, -0.1442852020263672, -0.13449859619140625, -0.12471199035644531, -0.11492538452148438, -0.10513877868652344, -0.0953521728515625, -0.08556556701660156, -0.07577896118164062, -0.06599235534667969, -0.05620574951171875, -0.04641914367675781, -0.036632537841796875, -0.026845932006835938, -0.017059326171875, -0.0072727203369140625, 0.002513885498046875, 0.012300491333007812, 0.02208709716796875, 0.03187370300292969, 0.041660308837890625, 0.05144691467285156, 0.0612335205078125, 0.07102012634277344, 0.08080673217773438, 0.09059333801269531, 0.10037994384765625, 0.11016654968261719, 0.11995315551757812, 0.12973976135253906, 0.1395263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 12.0, 27.0, 47.0, 68.0, 84.0, 127.0, 147.0, 161.0, 102.0, 96.0, 51.0, 29.0, 19.0, 12.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.293984293937683, -1.2637734413146973, -1.2335625886917114, -1.2033517360687256, -1.1731407642364502, -1.1429299116134644, -1.1127190589904785, -1.0825082063674927, -1.0522973537445068, -1.022086501121521, -0.9918756484985352, -0.9616647362709045, -0.9314538836479187, -0.9012430310249329, -0.8710321187973022, -0.8408212661743164, -0.8106104135513306, -0.7803995609283447, -0.7501887083053589, -0.7199777960777283, -0.6897669434547424, -0.6595560908317566, -0.629345178604126, -0.5991343259811401, -0.5689234733581543, -0.5387126207351685, -0.5085017681121826, -0.478290855884552, -0.44808000326156616, -0.4178691506385803, -0.3876582682132721, -0.35744738578796387, -0.32723647356033325, -0.2970256209373474, -0.2668147385120392, -0.23660387098789215, -0.20639300346374512, -0.17618213593959808, -0.14597126841545105, -0.11576040089130402, -0.08554953336715698, -0.05533866584300995, -0.025127798318862915, 0.005083069205284119, 0.03529393672943115, 0.06550480425357819, 0.09571567177772522, 0.12592653930187225, 0.1561374068260193, 0.18634827435016632, 0.21655914187431335, 0.2467700093984604, 0.2769808769226074, 0.30719172954559326, 0.3374026119709015, 0.3676134943962097, 0.39782434701919556, 0.4280351996421814, 0.4582460820674896, 0.48845696449279785, 0.5186678171157837, 0.5488786697387695, 0.5790895223617554, 0.609300434589386, 0.6395112872123718]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 4.0, 14.0, 12.0, 18.0, 22.0, 28.0, 33.0, 29.0, 32.0, 32.0, 40.0, 42.0, 54.0, 66.0, 46.0, 52.0, 56.0, 43.0, 46.0, 53.0, 36.0, 36.0, 42.0, 26.0, 19.0, 24.0, 16.0, 17.0, 13.0, 5.0, 6.0, 8.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38227951526641846, -0.368903249502182, -0.35552698373794556, -0.3421507179737091, -0.32877445220947266, -0.3153982162475586, -0.30202195048332214, -0.2886456847190857, -0.27526941895484924, -0.2618931531906128, -0.24851688742637634, -0.2351406365633011, -0.22176437079906464, -0.20838810503482819, -0.19501185417175293, -0.18163558840751648, -0.16825932264328003, -0.15488305687904358, -0.14150679111480713, -0.12813054025173187, -0.11475427448749542, -0.10137800872325897, -0.08800175040960312, -0.07462549209594727, -0.061249226331710815, -0.047872964292764664, -0.03449670225381851, -0.02112044021487236, -0.0077441781759262085, 0.005632087588310242, 0.019008345901966095, 0.03238460421562195, 0.045760899782180786, 0.05913716182112694, 0.07251342386007309, 0.08588968217372894, 0.0992659479379654, 0.11264221370220184, 0.1260184645652771, 0.13939473032951355, 0.15277099609375, 0.16614726185798645, 0.1795235276222229, 0.19289977848529816, 0.2062760442495346, 0.21965231001377106, 0.2330285608768463, 0.24640482664108276, 0.2597810924053192, 0.27315735816955566, 0.2865336239337921, 0.29990988969802856, 0.3132861256599426, 0.32666242122650146, 0.3400386571884155, 0.353414922952652, 0.3667911887168884, 0.3801674544811249, 0.39354372024536133, 0.4069199860095978, 0.42029625177383423, 0.4336724877357483, 0.44704875349998474, 0.4604250192642212, 0.47380128502845764]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 0.0, 5.0, 4.0, 6.0, 7.0, 11.0, 26.0, 54.0, 125.0, 416.0, 2088.0, 11373.0, 162061.0, 835448.0, 30825.0, 4753.0, 948.0, 223.0, 68.0, 41.0, 15.0, 13.0, 8.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5966796875, -0.5806617736816406, -0.5646438598632812, -0.5486259460449219, -0.5326080322265625, -0.5165901184082031, -0.5005722045898438, -0.4845542907714844, -0.468536376953125, -0.4525184631347656, -0.43650054931640625, -0.4204826354980469, -0.4044647216796875, -0.3884468078613281, -0.37242889404296875, -0.3564109802246094, -0.34039306640625, -0.3243751525878906, -0.30835723876953125, -0.2923393249511719, -0.2763214111328125, -0.2603034973144531, -0.24428558349609375, -0.22826766967773438, -0.212249755859375, -0.19623184204101562, -0.18021392822265625, -0.16419601440429688, -0.1481781005859375, -0.13216018676757812, -0.11614227294921875, -0.10012435913085938, -0.0841064453125, -0.06808853149414062, -0.05207061767578125, -0.036052703857421875, -0.0200347900390625, -0.004016876220703125, 0.01200103759765625, 0.028018951416015625, 0.044036865234375, 0.060054779052734375, 0.07607269287109375, 0.09209060668945312, 0.1081085205078125, 0.12412643432617188, 0.14014434814453125, 0.15616226196289062, 0.17218017578125, 0.18819808959960938, 0.20421600341796875, 0.22023391723632812, 0.2362518310546875, 0.2522697448730469, 0.26828765869140625, 0.2843055725097656, 0.300323486328125, 0.3163414001464844, 0.33235931396484375, 0.3483772277832031, 0.3643951416015625, 0.3804130554199219, 0.39643096923828125, 0.4124488830566406, 0.428466796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 10.0, 7.0, 21.0, 18.0, 18.0, 24.0, 24.0, 30.0, 31.0, 38.0, 37.0, 28.0, 47.0, 48.0, 61.0, 36.0, 56.0, 57.0, 53.0, 42.0, 45.0, 37.0, 37.0, 34.0, 17.0, 27.0, 22.0, 20.0, 16.0, 13.0, 6.0, 3.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.265380859375, -0.25646209716796875, -0.2475433349609375, -0.23862457275390625, -0.229705810546875, -0.22078704833984375, -0.2118682861328125, -0.20294952392578125, -0.19403076171875, -0.18511199951171875, -0.1761932373046875, -0.16727447509765625, -0.158355712890625, -0.14943695068359375, -0.1405181884765625, -0.13159942626953125, -0.1226806640625, -0.11376190185546875, -0.1048431396484375, -0.09592437744140625, -0.087005615234375, -0.07808685302734375, -0.0691680908203125, -0.06024932861328125, -0.05133056640625, -0.04241180419921875, -0.0334930419921875, -0.02457427978515625, -0.015655517578125, -0.00673675537109375, 0.0021820068359375, 0.01110076904296875, 0.02001953125, 0.02893829345703125, 0.0378570556640625, 0.04677581787109375, 0.055694580078125, 0.06461334228515625, 0.0735321044921875, 0.08245086669921875, 0.09136962890625, 0.10028839111328125, 0.1092071533203125, 0.11812591552734375, 0.127044677734375, 0.13596343994140625, 0.1448822021484375, 0.15380096435546875, 0.1627197265625, 0.17163848876953125, 0.1805572509765625, 0.18947601318359375, 0.198394775390625, 0.20731353759765625, 0.2162322998046875, 0.22515106201171875, 0.23406982421875, 0.24298858642578125, 0.2519073486328125, 0.26082611083984375, 0.269744873046875, 0.27866363525390625, 0.2875823974609375, 0.29650115966796875, 0.305419921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 16.0, 7.0, 24.0, 29.0, 56.0, 77.0, 102.0, 157.0, 257.0, 363.0, 566.0, 994.0, 1598.0, 2863.0, 5377.0, 11250.0, 26975.0, 80310.0, 253380.0, 394274.0, 176427.0, 54745.0, 19895.0, 8494.0, 4363.0, 2291.0, 1336.0, 791.0, 507.0, 321.0, 219.0, 128.0, 103.0, 65.0, 45.0, 38.0, 24.0, 17.0, 11.0, 11.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.11004638671875, -0.1068410873413086, -0.10363578796386719, -0.10043048858642578, -0.09722518920898438, -0.09401988983154297, -0.09081459045410156, -0.08760929107666016, -0.08440399169921875, -0.08119869232177734, -0.07799339294433594, -0.07478809356689453, -0.07158279418945312, -0.06837749481201172, -0.06517219543457031, -0.061966896057128906, -0.0587615966796875, -0.055556297302246094, -0.05235099792480469, -0.04914569854736328, -0.045940399169921875, -0.04273509979248047, -0.03952980041503906, -0.036324501037597656, -0.03311920166015625, -0.029913902282714844, -0.026708602905273438, -0.02350330352783203, -0.020298004150390625, -0.01709270477294922, -0.013887405395507812, -0.010682106018066406, -0.007476806640625, -0.004271507263183594, -0.0010662078857421875, 0.0021390914916992188, 0.005344390869140625, 0.008549690246582031, 0.011754989624023438, 0.014960289001464844, 0.01816558837890625, 0.021370887756347656, 0.024576187133789062, 0.02778148651123047, 0.030986785888671875, 0.03419208526611328, 0.03739738464355469, 0.040602684020996094, 0.0438079833984375, 0.047013282775878906, 0.05021858215332031, 0.05342388153076172, 0.056629180908203125, 0.05983448028564453, 0.06303977966308594, 0.06624507904052734, 0.06945037841796875, 0.07265567779541016, 0.07586097717285156, 0.07906627655029297, 0.08227157592773438, 0.08547687530517578, 0.08868217468261719, 0.0918874740600586, 0.0950927734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 15.0, 7.0, 9.0, 13.0, 20.0, 18.0, 24.0, 22.0, 22.0, 17.0, 22.0, 40.0, 30.0, 36.0, 42.0, 40.0, 36.0, 50.0, 41.0, 50.0, 52.0, 54.0, 34.0, 36.0, 35.0, 34.0, 29.0, 22.0, 23.0, 27.0, 15.0, 17.0, 11.0, 9.0, 11.0, 14.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.5498046875, -0.532958984375, -0.51611328125, -0.499267578125, -0.482421875, -0.465576171875, -0.44873046875, -0.431884765625, -0.4150390625, -0.398193359375, -0.38134765625, -0.364501953125, -0.34765625, -0.330810546875, -0.31396484375, -0.297119140625, -0.2802734375, -0.263427734375, -0.24658203125, -0.229736328125, -0.212890625, -0.196044921875, -0.17919921875, -0.162353515625, -0.1455078125, -0.128662109375, -0.11181640625, -0.094970703125, -0.078125, -0.061279296875, -0.04443359375, -0.027587890625, -0.0107421875, 0.006103515625, 0.02294921875, 0.039794921875, 0.056640625, 0.073486328125, 0.09033203125, 0.107177734375, 0.1240234375, 0.140869140625, 0.15771484375, 0.174560546875, 0.19140625, 0.208251953125, 0.22509765625, 0.241943359375, 0.2587890625, 0.275634765625, 0.29248046875, 0.309326171875, 0.326171875, 0.343017578125, 0.35986328125, 0.376708984375, 0.3935546875, 0.410400390625, 0.42724609375, 0.444091796875, 0.4609375, 0.477783203125, 0.49462890625, 0.511474609375, 0.5283203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 17.0, 23.0, 21.0, 27.0, 50.0, 83.0, 126.0, 180.0, 273.0, 444.0, 796.0, 1364.0, 2761.0, 5833.0, 14721.0, 45572.0, 152918.0, 365298.0, 302149.0, 104139.0, 31286.0, 10771.0, 4553.0, 2175.0, 1151.0, 652.0, 387.0, 251.0, 180.0, 114.0, 64.0, 49.0, 28.0, 27.0, 10.0, 14.0, 13.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0316162109375, -0.030708789825439453, -0.029801368713378906, -0.02889394760131836, -0.027986526489257812, -0.027079105377197266, -0.02617168426513672, -0.025264263153076172, -0.024356842041015625, -0.023449420928955078, -0.02254199981689453, -0.021634578704833984, -0.020727157592773438, -0.01981973648071289, -0.018912315368652344, -0.018004894256591797, -0.01709747314453125, -0.016190052032470703, -0.015282630920410156, -0.01437520980834961, -0.013467788696289062, -0.012560367584228516, -0.011652946472167969, -0.010745525360107422, -0.009838104248046875, -0.008930683135986328, -0.008023262023925781, -0.007115840911865234, -0.0062084197998046875, -0.005300998687744141, -0.004393577575683594, -0.003486156463623047, -0.0025787353515625, -0.0016713142395019531, -0.0007638931274414062, 0.00014352798461914062, 0.0010509490966796875, 0.0019583702087402344, 0.0028657913208007812, 0.003773212432861328, 0.004680633544921875, 0.005588054656982422, 0.006495475769042969, 0.007402896881103516, 0.008310317993164062, 0.00921773910522461, 0.010125160217285156, 0.011032581329345703, 0.01194000244140625, 0.012847423553466797, 0.013754844665527344, 0.01466226577758789, 0.015569686889648438, 0.016477108001708984, 0.01738452911376953, 0.018291950225830078, 0.019199371337890625, 0.020106792449951172, 0.02101421356201172, 0.021921634674072266, 0.022829055786132812, 0.02373647689819336, 0.024643898010253906, 0.025551319122314453, 0.026458740234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 14.0, 12.0, 34.0, 28.0, 34.0, 42.0, 61.0, 89.0, 95.0, 80.0, 95.0, 80.0, 92.0, 54.0, 46.0, 39.0, 31.0, 18.0, 18.0, 12.0, 2.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5077181160449982e-05, -1.453794538974762e-05, -1.3998709619045258e-05, -1.3459473848342896e-05, -1.2920238077640533e-05, -1.2381002306938171e-05, -1.184176653623581e-05, -1.1302530765533447e-05, -1.0763294994831085e-05, -1.0224059224128723e-05, -9.684823453426361e-06, -9.145587682723999e-06, -8.606351912021637e-06, -8.067116141319275e-06, -7.527880370616913e-06, -6.988644599914551e-06, -6.449408829212189e-06, -5.910173058509827e-06, -5.370937287807465e-06, -4.8317015171051025e-06, -4.2924657464027405e-06, -3.7532299757003784e-06, -3.2139942049980164e-06, -2.6747584342956543e-06, -2.1355226635932922e-06, -1.5962868928909302e-06, -1.0570511221885681e-06, -5.178153514862061e-07, 2.1420419216156006e-08, 5.606561899185181e-07, 1.0998919606208801e-06, 1.6391277313232422e-06, 2.1783635020256042e-06, 2.7175992727279663e-06, 3.2568350434303284e-06, 3.7960708141326904e-06, 4.3353065848350525e-06, 4.8745423555374146e-06, 5.413778126239777e-06, 5.953013896942139e-06, 6.492249667644501e-06, 7.031485438346863e-06, 7.570721209049225e-06, 8.109956979751587e-06, 8.649192750453949e-06, 9.188428521156311e-06, 9.727664291858673e-06, 1.0266900062561035e-05, 1.0806135833263397e-05, 1.134537160396576e-05, 1.1884607374668121e-05, 1.2423843145370483e-05, 1.2963078916072845e-05, 1.3502314686775208e-05, 1.404155045747757e-05, 1.4580786228179932e-05, 1.5120021998882294e-05, 1.5659257769584656e-05, 1.6198493540287018e-05, 1.673772931098938e-05, 1.7276965081691742e-05, 1.7816200852394104e-05, 1.8355436623096466e-05, 1.8894672393798828e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 19.0, 21.0, 27.0, 40.0, 86.0, 128.0, 209.0, 388.0, 919.0, 2420.0, 8791.0, 37122.0, 172863.0, 468487.0, 274720.0, 62444.0, 13849.0, 3670.0, 1191.0, 495.0, 235.0, 132.0, 98.0, 65.0, 38.0, 21.0, 27.0, 10.0, 12.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042266845703125, -0.04093217849731445, -0.039597511291503906, -0.03826284408569336, -0.03692817687988281, -0.035593509674072266, -0.03425884246826172, -0.03292417526245117, -0.031589508056640625, -0.030254840850830078, -0.02892017364501953, -0.027585506439208984, -0.026250839233398438, -0.02491617202758789, -0.023581504821777344, -0.022246837615966797, -0.02091217041015625, -0.019577503204345703, -0.018242835998535156, -0.01690816879272461, -0.015573501586914062, -0.014238834381103516, -0.012904167175292969, -0.011569499969482422, -0.010234832763671875, -0.008900165557861328, -0.007565498352050781, -0.006230831146240234, -0.0048961639404296875, -0.0035614967346191406, -0.0022268295288085938, -0.0008921623229980469, 0.0004425048828125, 0.0017771720886230469, 0.0031118392944335938, 0.004446506500244141, 0.0057811737060546875, 0.007115840911865234, 0.008450508117675781, 0.009785175323486328, 0.011119842529296875, 0.012454509735107422, 0.013789176940917969, 0.015123844146728516, 0.016458511352539062, 0.01779317855834961, 0.019127845764160156, 0.020462512969970703, 0.02179718017578125, 0.023131847381591797, 0.024466514587402344, 0.02580118179321289, 0.027135848999023438, 0.028470516204833984, 0.02980518341064453, 0.031139850616455078, 0.032474517822265625, 0.03380918502807617, 0.03514385223388672, 0.036478519439697266, 0.03781318664550781, 0.03914785385131836, 0.040482521057128906, 0.04181718826293945, 0.04315185546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 7.0, 7.0, 11.0, 6.0, 14.0, 12.0, 19.0, 22.0, 41.0, 46.0, 43.0, 59.0, 76.0, 84.0, 73.0, 78.0, 77.0, 64.0, 56.0, 41.0, 27.0, 39.0, 40.0, 17.0, 13.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.016693115234375, -0.01629197597503662, -0.015890836715698242, -0.015489697456359863, -0.015088558197021484, -0.014687418937683105, -0.014286279678344727, -0.013885140419006348, -0.013484001159667969, -0.01308286190032959, -0.012681722640991211, -0.012280583381652832, -0.011879444122314453, -0.011478304862976074, -0.011077165603637695, -0.010676026344299316, -0.010274887084960938, -0.009873747825622559, -0.00947260856628418, -0.0090714693069458, -0.008670330047607422, -0.008269190788269043, -0.007868051528930664, -0.007466912269592285, -0.007065773010253906, -0.006664633750915527, -0.0062634944915771484, -0.0058623552322387695, -0.005461215972900391, -0.005060076713562012, -0.004658937454223633, -0.004257798194885254, -0.003856658935546875, -0.003455519676208496, -0.003054380416870117, -0.0026532411575317383, -0.0022521018981933594, -0.0018509626388549805, -0.0014498233795166016, -0.0010486841201782227, -0.0006475448608398438, -0.00024640560150146484, 0.00015473365783691406, 0.000555872917175293, 0.0009570121765136719, 0.0013581514358520508, 0.0017592906951904297, 0.0021604299545288086, 0.0025615692138671875, 0.0029627084732055664, 0.0033638477325439453, 0.0037649869918823242, 0.004166126251220703, 0.004567265510559082, 0.004968404769897461, 0.00536954402923584, 0.005770683288574219, 0.006171822547912598, 0.0065729618072509766, 0.0069741010665893555, 0.007375240325927734, 0.007776379585266113, 0.008177518844604492, 0.008578658103942871, 0.00897979736328125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 23.0, 69.0, 167.0, 245.0, 260.0, 150.0, 64.0, 13.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9459316730499268, -1.9085006713867188, -1.8710697889328003, -1.8336387872695923, -1.7962079048156738, -1.7587769031524658, -1.7213460206985474, -1.6839150190353394, -1.646484136581421, -1.609053134918213, -1.5716222524642944, -1.5341912508010864, -1.496760368347168, -1.45932936668396, -1.4218984842300415, -1.3844674825668335, -1.347036600112915, -1.309605598449707, -1.2721747159957886, -1.2347437143325806, -1.197312831878662, -1.159881830215454, -1.1224509477615356, -1.0850199460983276, -1.0475889444351196, -1.0101579427719116, -0.9727270603179932, -0.9352961182594299, -0.8978651762008667, -0.8604342341423035, -0.8230032920837402, -0.7855722904205322, -0.7481414079666138, -0.7107104659080505, -0.6732795238494873, -0.6358485817909241, -0.5984176397323608, -0.5609866976737976, -0.5235557556152344, -0.48612478375434875, -0.4486938714981079, -0.4112629294395447, -0.37383198738098145, -0.3364010453224182, -0.298970103263855, -0.26153916120529175, -0.22410818934440613, -0.1866772472858429, -0.14924630522727966, -0.11181536316871643, -0.0743844136595726, -0.03695346415042877, 0.00047747790813446045, 0.03790841996669769, 0.07533937692642212, 0.11277031898498535, 0.15020126104354858, 0.18763220310211182, 0.22506314516067505, 0.2624940872192383, 0.2999250292778015, 0.33735597133636475, 0.37478694319725037, 0.4122178852558136, 0.44964882731437683]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 16.0, 18.0, 19.0, 20.0, 25.0, 37.0, 33.0, 41.0, 39.0, 49.0, 63.0, 62.0, 58.0, 63.0, 47.0, 61.0, 53.0, 45.0, 47.0, 38.0, 30.0, 21.0, 22.0, 21.0, 10.0, 8.0, 9.0, 9.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2811904847621918, -0.27113327383995056, -0.26107603311538696, -0.25101882219314575, -0.24096161127090454, -0.23090438544750214, -0.22084715962409973, -0.21078994870185852, -0.20073272287845612, -0.1906754970550537, -0.1806182861328125, -0.1705610603094101, -0.1605038344860077, -0.15044662356376648, -0.14038939774036407, -0.13033217191696167, -0.12027496099472046, -0.11021774262189865, -0.10016052424907684, -0.09010329842567444, -0.08004608005285263, -0.06998886168003082, -0.059931639581918716, -0.04987441748380661, -0.0398171991109848, -0.029759978875517845, -0.019702758640050888, -0.009645538404583931, 0.0004116818308830261, 0.010468900203704834, 0.02052612230181694, 0.030583344399929047, 0.04064059257507324, 0.05069781094789505, 0.060755033046007156, 0.07081225514411926, 0.08086947351694107, 0.09092669188976288, 0.10098391771316528, 0.11104113608598709, 0.1210983544588089, 0.1311555802822113, 0.14121279120445251, 0.15127001702785492, 0.16132724285125732, 0.17138445377349854, 0.18144167959690094, 0.19149890542030334, 0.20155611634254456, 0.21161334216594696, 0.22167055308818817, 0.23172777891159058, 0.2417849898338318, 0.251842200756073, 0.2618994414806366, 0.2719566524028778, 0.2820138931274414, 0.2920711040496826, 0.3021283447742462, 0.3121855556964874, 0.32224276661872864, 0.33230000734329224, 0.34235721826553345, 0.35241442918777466, 0.36247164011001587]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 17.0, 15.0, 23.0, 21.0, 59.0, 95.0, 189.0, 415.0, 895.0, 2384.0, 8274.0, 35391.0, 235661.0, 658402.0, 83655.0, 16326.0, 4209.0, 1398.0, 543.0, 237.0, 128.0, 64.0, 43.0, 29.0, 21.0, 16.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458984375, -0.442138671875, -0.42529296875, -0.408447265625, -0.3916015625, -0.374755859375, -0.35791015625, -0.341064453125, -0.32421875, -0.307373046875, -0.29052734375, -0.273681640625, -0.2568359375, -0.239990234375, -0.22314453125, -0.206298828125, -0.189453125, -0.172607421875, -0.15576171875, -0.138916015625, -0.1220703125, -0.105224609375, -0.08837890625, -0.071533203125, -0.0546875, -0.037841796875, -0.02099609375, -0.004150390625, 0.0126953125, 0.029541015625, 0.04638671875, 0.063232421875, 0.080078125, 0.096923828125, 0.11376953125, 0.130615234375, 0.1474609375, 0.164306640625, 0.18115234375, 0.197998046875, 0.21484375, 0.231689453125, 0.24853515625, 0.265380859375, 0.2822265625, 0.299072265625, 0.31591796875, 0.332763671875, 0.349609375, 0.366455078125, 0.38330078125, 0.400146484375, 0.4169921875, 0.433837890625, 0.45068359375, 0.467529296875, 0.484375, 0.501220703125, 0.51806640625, 0.534912109375, 0.5517578125, 0.568603515625, 0.58544921875, 0.602294921875, 0.619140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 12.0, 12.0, 15.0, 21.0, 42.0, 40.0, 53.0, 70.0, 63.0, 90.0, 78.0, 100.0, 79.0, 79.0, 66.0, 55.0, 41.0, 30.0, 17.0, 16.0, 10.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497314453125, -0.4694633483886719, -0.44161224365234375, -0.4137611389160156, -0.3859100341796875, -0.3580589294433594, -0.33020782470703125, -0.3023567199707031, -0.274505615234375, -0.24665451049804688, -0.21880340576171875, -0.19095230102539062, -0.1631011962890625, -0.13525009155273438, -0.10739898681640625, -0.07954788208007812, -0.05169677734375, -0.023845672607421875, 0.00400543212890625, 0.031856536865234375, 0.0597076416015625, 0.08755874633789062, 0.11540985107421875, 0.14326095581054688, 0.171112060546875, 0.19896316528320312, 0.22681427001953125, 0.2546653747558594, 0.2825164794921875, 0.3103675842285156, 0.33821868896484375, 0.3660697937011719, 0.3939208984375, 0.4217720031738281, 0.44962310791015625, 0.4774742126464844, 0.5053253173828125, 0.5331764221191406, 0.5610275268554688, 0.5888786315917969, 0.616729736328125, 0.6445808410644531, 0.6724319458007812, 0.7002830505371094, 0.7281341552734375, 0.7559852600097656, 0.7838363647460938, 0.8116874694824219, 0.83953857421875, 0.8673896789550781, 0.8952407836914062, 0.9230918884277344, 0.9509429931640625, 0.9787940979003906, 1.0066452026367188, 1.0344963073730469, 1.062347412109375, 1.0901985168457031, 1.1180496215820312, 1.1459007263183594, 1.1737518310546875, 1.2016029357910156, 1.2294540405273438, 1.2573051452636719, 1.28515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 10.0, 10.0, 7.0, 16.0, 12.0, 24.0, 29.0, 32.0, 54.0, 79.0, 105.0, 159.0, 290.0, 749.0, 4131.0, 75865.0, 914204.0, 48111.0, 3132.0, 707.0, 289.0, 128.0, 78.0, 69.0, 59.0, 33.0, 29.0, 32.0, 23.0, 15.0, 13.0, 12.0, 5.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95458984375, -0.9232254028320312, -0.8918609619140625, -0.8604965209960938, -0.829132080078125, -0.7977676391601562, -0.7664031982421875, -0.7350387573242188, -0.70367431640625, -0.6723098754882812, -0.6409454345703125, -0.6095809936523438, -0.578216552734375, -0.5468521118164062, -0.5154876708984375, -0.48412322998046875, -0.4527587890625, -0.42139434814453125, -0.3900299072265625, -0.35866546630859375, -0.327301025390625, -0.29593658447265625, -0.2645721435546875, -0.23320770263671875, -0.20184326171875, -0.17047882080078125, -0.1391143798828125, -0.10774993896484375, -0.076385498046875, -0.04502105712890625, -0.0136566162109375, 0.01770782470703125, 0.049072265625, 0.08043670654296875, 0.1118011474609375, 0.14316558837890625, 0.174530029296875, 0.20589447021484375, 0.2372589111328125, 0.26862335205078125, 0.29998779296875, 0.33135223388671875, 0.3627166748046875, 0.39408111572265625, 0.425445556640625, 0.45680999755859375, 0.4881744384765625, 0.5195388793945312, 0.5509033203125, 0.5822677612304688, 0.6136322021484375, 0.6449966430664062, 0.676361083984375, 0.7077255249023438, 0.7390899658203125, 0.7704544067382812, 0.80181884765625, 0.8331832885742188, 0.8645477294921875, 0.8959121704101562, 0.927276611328125, 0.9586410522460938, 0.9900054931640625, 1.0213699340820312, 1.052734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 5.0, 8.0, 9.0, 3.0, 3.0, 12.0, 12.0, 14.0, 17.0, 19.0, 24.0, 19.0, 27.0, 27.0, 30.0, 36.0, 47.0, 43.0, 48.0, 36.0, 46.0, 40.0, 39.0, 43.0, 47.0, 34.0, 38.0, 41.0, 37.0, 26.0, 18.0, 23.0, 25.0, 20.0, 11.0, 10.0, 10.0, 10.0, 11.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5166015625, -0.49932098388671875, -0.4820404052734375, -0.46475982666015625, -0.447479248046875, -0.43019866943359375, -0.4129180908203125, -0.39563751220703125, -0.37835693359375, -0.36107635498046875, -0.3437957763671875, -0.32651519775390625, -0.309234619140625, -0.29195404052734375, -0.2746734619140625, -0.25739288330078125, -0.2401123046875, -0.22283172607421875, -0.2055511474609375, -0.18827056884765625, -0.170989990234375, -0.15370941162109375, -0.1364288330078125, -0.11914825439453125, -0.10186767578125, -0.08458709716796875, -0.0673065185546875, -0.05002593994140625, -0.032745361328125, -0.01546478271484375, 0.0018157958984375, 0.01909637451171875, 0.036376953125, 0.05365753173828125, 0.0709381103515625, 0.08821868896484375, 0.105499267578125, 0.12277984619140625, 0.1400604248046875, 0.15734100341796875, 0.17462158203125, 0.19190216064453125, 0.2091827392578125, 0.22646331787109375, 0.243743896484375, 0.26102447509765625, 0.2783050537109375, 0.29558563232421875, 0.3128662109375, 0.33014678955078125, 0.3474273681640625, 0.36470794677734375, 0.381988525390625, 0.39926910400390625, 0.4165496826171875, 0.43383026123046875, 0.45111083984375, 0.46839141845703125, 0.4856719970703125, 0.5029525756835938, 0.520233154296875, 0.5375137329101562, 0.5547943115234375, 0.5720748901367188, 0.58935546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 9.0, 13.0, 25.0, 28.0, 42.0, 60.0, 104.0, 136.0, 271.0, 625.0, 1924.0, 9704.0, 246145.0, 762704.0, 22083.0, 3021.0, 857.0, 306.0, 159.0, 84.0, 67.0, 50.0, 38.0, 24.0, 17.0, 10.0, 9.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3076171875, -0.298614501953125, -0.28961181640625, -0.280609130859375, -0.2716064453125, -0.262603759765625, -0.25360107421875, -0.244598388671875, -0.235595703125, -0.226593017578125, -0.21759033203125, -0.208587646484375, -0.1995849609375, -0.190582275390625, -0.18157958984375, -0.172576904296875, -0.16357421875, -0.154571533203125, -0.14556884765625, -0.136566162109375, -0.1275634765625, -0.118560791015625, -0.10955810546875, -0.100555419921875, -0.091552734375, -0.082550048828125, -0.07354736328125, -0.064544677734375, -0.0555419921875, -0.046539306640625, -0.03753662109375, -0.028533935546875, -0.01953125, -0.010528564453125, -0.00152587890625, 0.007476806640625, 0.0164794921875, 0.025482177734375, 0.03448486328125, 0.043487548828125, 0.052490234375, 0.061492919921875, 0.07049560546875, 0.079498291015625, 0.0885009765625, 0.097503662109375, 0.10650634765625, 0.115509033203125, 0.12451171875, 0.133514404296875, 0.14251708984375, 0.151519775390625, 0.1605224609375, 0.169525146484375, 0.17852783203125, 0.187530517578125, 0.196533203125, 0.205535888671875, 0.21453857421875, 0.223541259765625, 0.2325439453125, 0.241546630859375, 0.25054931640625, 0.259552001953125, 0.2685546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 12.0, 5.0, 12.0, 8.0, 21.0, 20.0, 20.0, 47.0, 76.0, 118.0, 127.0, 162.0, 117.0, 76.0, 59.0, 47.0, 20.0, 16.0, 9.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.236532211303711e-05, -3.14200296998024e-05, -3.0474737286567688e-05, -2.9529444873332977e-05, -2.8584152460098267e-05, -2.7638860046863556e-05, -2.6693567633628845e-05, -2.5748275220394135e-05, -2.4802982807159424e-05, -2.3857690393924713e-05, -2.2912397980690002e-05, -2.1967105567455292e-05, -2.102181315422058e-05, -2.007652074098587e-05, -1.913122832775116e-05, -1.818593591451645e-05, -1.7240643501281738e-05, -1.6295351088047028e-05, -1.5350058674812317e-05, -1.4404766261577606e-05, -1.3459473848342896e-05, -1.2514181435108185e-05, -1.1568889021873474e-05, -1.0623596608638763e-05, -9.678304195404053e-06, -8.733011782169342e-06, -7.787719368934631e-06, -6.842426955699921e-06, -5.89713454246521e-06, -4.951842129230499e-06, -4.0065497159957886e-06, -3.061257302761078e-06, -2.115964889526367e-06, -1.1706724762916565e-06, -2.253800630569458e-07, 7.199123501777649e-07, 1.6652047634124756e-06, 2.6104971766471863e-06, 3.555789589881897e-06, 4.501082003116608e-06, 5.446374416351318e-06, 6.391666829586029e-06, 7.33695924282074e-06, 8.28225165605545e-06, 9.227544069290161e-06, 1.0172836482524872e-05, 1.1118128895759583e-05, 1.2063421308994293e-05, 1.3008713722229004e-05, 1.3954006135463715e-05, 1.4899298548698425e-05, 1.5844590961933136e-05, 1.6789883375167847e-05, 1.7735175788402557e-05, 1.8680468201637268e-05, 1.962576061487198e-05, 2.057105302810669e-05, 2.15163454413414e-05, 2.246163785457611e-05, 2.340693026781082e-05, 2.4352222681045532e-05, 2.5297515094280243e-05, 2.6242807507514954e-05, 2.7188099920749664e-05, 2.8133392333984375e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 5.0, 8.0, 11.0, 10.0, 10.0, 25.0, 21.0, 20.0, 38.0, 60.0, 73.0, 108.0, 142.0, 285.0, 490.0, 931.0, 1762.0, 4075.0, 12458.0, 84273.0, 729050.0, 184527.0, 19702.0, 5495.0, 2241.0, 1154.0, 553.0, 339.0, 206.0, 131.0, 84.0, 61.0, 53.0, 35.0, 30.0, 22.0, 15.0, 11.0, 5.0, 6.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2076416015625, -0.20147132873535156, -0.19530105590820312, -0.1891307830810547, -0.18296051025390625, -0.1767902374267578, -0.17061996459960938, -0.16444969177246094, -0.1582794189453125, -0.15210914611816406, -0.14593887329101562, -0.1397686004638672, -0.13359832763671875, -0.1274280548095703, -0.12125778198242188, -0.11508750915527344, -0.108917236328125, -0.10274696350097656, -0.09657669067382812, -0.09040641784667969, -0.08423614501953125, -0.07806587219238281, -0.07189559936523438, -0.06572532653808594, -0.0595550537109375, -0.05338478088378906, -0.047214508056640625, -0.04104423522949219, -0.03487396240234375, -0.028703689575195312, -0.022533416748046875, -0.016363143920898438, -0.01019287109375, -0.0040225982666015625, 0.002147674560546875, 0.008317947387695312, 0.01448822021484375, 0.020658493041992188, 0.026828765869140625, 0.03299903869628906, 0.0391693115234375, 0.04533958435058594, 0.051509857177734375, 0.05768013000488281, 0.06385040283203125, 0.07002067565917969, 0.07619094848632812, 0.08236122131347656, 0.088531494140625, 0.09470176696777344, 0.10087203979492188, 0.10704231262207031, 0.11321258544921875, 0.11938285827636719, 0.12555313110351562, 0.13172340393066406, 0.1378936767578125, 0.14406394958496094, 0.15023422241210938, 0.1564044952392578, 0.16257476806640625, 0.1687450408935547, 0.17491531372070312, 0.18108558654785156, 0.187255859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 10.0, 18.0, 15.0, 18.0, 42.0, 53.0, 62.0, 73.0, 103.0, 114.0, 120.0, 84.0, 76.0, 39.0, 37.0, 30.0, 25.0, 8.0, 10.0, 6.0, 9.0, 4.0, 4.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07684326171875, -0.07448101043701172, -0.07211875915527344, -0.06975650787353516, -0.06739425659179688, -0.0650320053100586, -0.06266975402832031, -0.06030750274658203, -0.05794525146484375, -0.05558300018310547, -0.05322074890136719, -0.050858497619628906, -0.048496246337890625, -0.046133995056152344, -0.04377174377441406, -0.04140949249267578, -0.0390472412109375, -0.03668498992919922, -0.03432273864746094, -0.031960487365722656, -0.029598236083984375, -0.027235984802246094, -0.024873733520507812, -0.02251148223876953, -0.02014923095703125, -0.01778697967529297, -0.015424728393554688, -0.013062477111816406, -0.010700225830078125, -0.008337974548339844, -0.0059757232666015625, -0.0036134719848632812, -0.001251220703125, 0.0011110305786132812, 0.0034732818603515625, 0.005835533142089844, 0.008197784423828125, 0.010560035705566406, 0.012922286987304688, 0.015284538269042969, 0.01764678955078125, 0.02000904083251953, 0.022371292114257812, 0.024733543395996094, 0.027095794677734375, 0.029458045959472656, 0.03182029724121094, 0.03418254852294922, 0.0365447998046875, 0.03890705108642578, 0.04126930236816406, 0.043631553649902344, 0.045993804931640625, 0.048356056213378906, 0.05071830749511719, 0.05308055877685547, 0.05544281005859375, 0.05780506134033203, 0.06016731262207031, 0.0625295639038086, 0.06489181518554688, 0.06725406646728516, 0.06961631774902344, 0.07197856903076172, 0.0743408203125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 199.0, 682.0, 112.0, 12.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.27834701538086, -12.064332008361816, -11.850317001342773, -11.63630199432373, -11.422286987304688, -11.208271980285645, -10.994256973266602, -10.780241012573242, -10.5662260055542, -10.352210998535156, -10.138195991516113, -9.92418098449707, -9.710165977478027, -9.496150970458984, -9.282135009765625, -9.068120956420898, -8.854105949401855, -8.640090942382812, -8.42607593536377, -8.212060928344727, -7.998045444488525, -7.784030437469482, -7.5700154304504395, -7.3560004234313965, -7.141984939575195, -6.927969932556152, -6.713954925537109, -6.499939918518066, -6.285924434661865, -6.071909427642822, -5.857894420623779, -5.643879413604736, -5.429863929748535, -5.215848922729492, -5.001833915710449, -4.787818908691406, -4.573803424835205, -4.359788417816162, -4.145773410797119, -3.931758403778076, -3.717743396759033, -3.5037283897399902, -3.289713144302368, -3.075698137283325, -2.8616831302642822, -2.64766788482666, -2.433652877807617, -2.219637870788574, -2.0056228637695312, -1.7916077375411987, -1.5775927305221558, -1.3635776042938232, -1.1495625972747803, -0.9355474710464478, -0.7215323448181152, -0.5075173377990723, -0.2935020923614502, -0.07948701083660126, 0.13452807068824768, 0.3485431671142578, 0.5625582337379456, 0.7765733003616333, 0.9905884265899658, 1.2046034336090088, 1.4186185598373413]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 2.0, 8.0, 7.0, 7.0, 14.0, 16.0, 15.0, 16.0, 20.0, 23.0, 30.0, 34.0, 22.0, 46.0, 45.0, 61.0, 52.0, 61.0, 41.0, 63.0, 60.0, 42.0, 35.0, 31.0, 45.0, 36.0, 21.0, 31.0, 17.0, 24.0, 13.0, 19.0, 5.0, 6.0, 7.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9674336314201355, -0.9344180822372437, -0.901402473449707, -0.8683869242668152, -0.8353713154792786, -0.8023557662963867, -0.7693401575088501, -0.7363246083259583, -0.7033090591430664, -0.6702935099601746, -0.6372779011726379, -0.6042623519897461, -0.5712467432022095, -0.5382311940193176, -0.5052156448364258, -0.47220003604888916, -0.43918442726135254, -0.4061688482761383, -0.3731532692909241, -0.3401377201080322, -0.3071221113204956, -0.27410656213760376, -0.24109098315238953, -0.2080754041671753, -0.17505982518196106, -0.14204424619674683, -0.10902867466211319, -0.07601310312747955, -0.04299752414226532, -0.009981945157051086, 0.023033618927001953, 0.056049197912216187, 0.0890648365020752, 0.12208041548728943, 0.15509599447250366, 0.1881115585565567, 0.22112713754177094, 0.254142701625824, 0.2871582806110382, 0.32017385959625244, 0.3531894385814667, 0.3862050175666809, 0.41922059655189514, 0.4522361755371094, 0.4852517247200012, 0.5182673335075378, 0.5512828826904297, 0.5842984914779663, 0.6173140406608582, 0.65032958984375, 0.6833451986312866, 0.7163607478141785, 0.7493763566017151, 0.7823919057846069, 0.8154075145721436, 0.8484230637550354, 0.8814386129379272, 0.9144541621208191, 0.9474697709083557, 0.9804853200912476, 1.0135009288787842, 1.0465165376663208, 1.0795320272445679, 1.1125476360321045, 1.1455632448196411]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 27.0, 19.0, 50.0, 83.0, 147.0, 242.0, 447.0, 973.0, 2685.0, 10268.0, 71929.0, 1357954.0, 2572247.0, 153931.0, 16645.0, 3892.0, 1373.0, 630.0, 281.0, 177.0, 93.0, 66.0, 33.0, 26.0, 14.0, 13.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8599662780761719, -0.8395614624023438, -0.8191566467285156, -0.7987518310546875, -0.7783470153808594, -0.7579421997070312, -0.7375373840332031, -0.717132568359375, -0.6967277526855469, -0.6763229370117188, -0.6559181213378906, -0.6355133056640625, -0.6151084899902344, -0.5947036743164062, -0.5742988586425781, -0.55389404296875, -0.5334892272949219, -0.5130844116210938, -0.4926795959472656, -0.4722747802734375, -0.4518699645996094, -0.43146514892578125, -0.4110603332519531, -0.390655517578125, -0.3702507019042969, -0.34984588623046875, -0.3294410705566406, -0.3090362548828125, -0.2886314392089844, -0.26822662353515625, -0.24782180786132812, -0.2274169921875, -0.20701217651367188, -0.18660736083984375, -0.16620254516601562, -0.1457977294921875, -0.12539291381835938, -0.10498809814453125, -0.08458328247070312, -0.064178466796875, -0.043773651123046875, -0.02336883544921875, -0.002964019775390625, 0.0174407958984375, 0.037845611572265625, 0.05825042724609375, 0.07865524291992188, 0.09906005859375, 0.11946487426757812, 0.13986968994140625, 0.16027450561523438, 0.1806793212890625, 0.20108413696289062, 0.22148895263671875, 0.24189376831054688, 0.262298583984375, 0.2827033996582031, 0.30310821533203125, 0.3235130310058594, 0.3439178466796875, 0.3643226623535156, 0.38472747802734375, 0.4051322937011719, 0.425537109375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 15.0, 19.0, 20.0, 22.0, 20.0, 30.0, 25.0, 46.0, 37.0, 55.0, 76.0, 68.0, 55.0, 55.0, 50.0, 58.0, 42.0, 52.0, 36.0, 47.0, 25.0, 30.0, 23.0, 19.0, 8.0, 11.0, 8.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303466796875, -0.2922096252441406, -0.28095245361328125, -0.2696952819824219, -0.2584381103515625, -0.24718093872070312, -0.23592376708984375, -0.22466659545898438, -0.213409423828125, -0.20215225219726562, -0.19089508056640625, -0.17963790893554688, -0.1683807373046875, -0.15712356567382812, -0.14586639404296875, -0.13460922241210938, -0.12335205078125, -0.11209487915039062, -0.10083770751953125, -0.08958053588867188, -0.0783233642578125, -0.06706619262695312, -0.05580902099609375, -0.044551849365234375, -0.033294677734375, -0.022037506103515625, -0.01078033447265625, 0.000476837158203125, 0.0117340087890625, 0.022991180419921875, 0.03424835205078125, 0.045505523681640625, 0.0567626953125, 0.06801986694335938, 0.07927703857421875, 0.09053421020507812, 0.1017913818359375, 0.11304855346679688, 0.12430572509765625, 0.13556289672851562, 0.146820068359375, 0.15807723999023438, 0.16933441162109375, 0.18059158325195312, 0.1918487548828125, 0.20310592651367188, 0.21436309814453125, 0.22562026977539062, 0.23687744140625, 0.24813461303710938, 0.25939178466796875, 0.2706489562988281, 0.2819061279296875, 0.2931632995605469, 0.30442047119140625, 0.3156776428222656, 0.326934814453125, 0.3381919860839844, 0.34944915771484375, 0.3607063293457031, 0.3719635009765625, 0.3832206726074219, 0.39447784423828125, 0.4057350158691406, 0.4169921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 14.0, 14.0, 37.0, 50.0, 105.0, 269.0, 852.0, 4925.0, 146571.0, 3995825.0, 41634.0, 2864.0, 659.0, 207.0, 97.0, 54.0, 25.0, 26.0, 9.0, 8.0, 8.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7158203125, -1.6710968017578125, -1.626373291015625, -1.5816497802734375, -1.53692626953125, -1.4922027587890625, -1.447479248046875, -1.4027557373046875, -1.3580322265625, -1.3133087158203125, -1.268585205078125, -1.2238616943359375, -1.17913818359375, -1.1344146728515625, -1.089691162109375, -1.0449676513671875, -1.000244140625, -0.9555206298828125, -0.910797119140625, -0.8660736083984375, -0.82135009765625, -0.7766265869140625, -0.731903076171875, -0.6871795654296875, -0.6424560546875, -0.5977325439453125, -0.553009033203125, -0.5082855224609375, -0.46356201171875, -0.4188385009765625, -0.374114990234375, -0.3293914794921875, -0.28466796875, -0.2399444580078125, -0.195220947265625, -0.1504974365234375, -0.10577392578125, -0.0610504150390625, -0.016326904296875, 0.0283966064453125, 0.0731201171875, 0.1178436279296875, 0.162567138671875, 0.2072906494140625, 0.25201416015625, 0.2967376708984375, 0.341461181640625, 0.3861846923828125, 0.430908203125, 0.4756317138671875, 0.520355224609375, 0.5650787353515625, 0.60980224609375, 0.6545257568359375, 0.699249267578125, 0.7439727783203125, 0.7886962890625, 0.8334197998046875, 0.878143310546875, 0.9228668212890625, 0.96759033203125, 1.0123138427734375, 1.057037353515625, 1.1017608642578125, 1.146484375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 8.0, 13.0, 13.0, 21.0, 37.0, 66.0, 73.0, 127.0, 216.0, 396.0, 605.0, 752.0, 636.0, 488.0, 245.0, 125.0, 100.0, 47.0, 27.0, 16.0, 6.0, 13.0, 3.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17041015625, -0.1642284393310547, -0.15804672241210938, -0.15186500549316406, -0.14568328857421875, -0.13950157165527344, -0.13331985473632812, -0.1271381378173828, -0.1209564208984375, -0.11477470397949219, -0.10859298706054688, -0.10241127014160156, -0.09622955322265625, -0.09004783630371094, -0.08386611938476562, -0.07768440246582031, -0.071502685546875, -0.06532096862792969, -0.059139251708984375, -0.05295753479003906, -0.04677581787109375, -0.04059410095214844, -0.034412384033203125, -0.028230667114257812, -0.0220489501953125, -0.015867233276367188, -0.009685516357421875, -0.0035037994384765625, 0.00267791748046875, 0.008859634399414062, 0.015041351318359375, 0.021223068237304688, 0.02740478515625, 0.03358650207519531, 0.039768218994140625, 0.04594993591308594, 0.05213165283203125, 0.05831336975097656, 0.06449508666992188, 0.07067680358886719, 0.0768585205078125, 0.08304023742675781, 0.08922195434570312, 0.09540367126464844, 0.10158538818359375, 0.10776710510253906, 0.11394882202148438, 0.12013053894042969, 0.126312255859375, 0.1324939727783203, 0.13867568969726562, 0.14485740661621094, 0.15103912353515625, 0.15722084045410156, 0.16340255737304688, 0.1695842742919922, 0.1757659912109375, 0.1819477081298828, 0.18812942504882812, 0.19431114196777344, 0.20049285888671875, 0.20667457580566406, 0.21285629272460938, 0.2190380096435547, 0.2252197265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 11.0, 13.0, 22.0, 24.0, 38.0, 52.0, 72.0, 78.0, 87.0, 97.0, 103.0, 89.0, 85.0, 65.0, 45.0, 36.0, 34.0, 22.0, 11.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7341853380203247, -0.7143028974533081, -0.6944205164909363, -0.6745380759239197, -0.6546556949615479, -0.6347732543945312, -0.6148908138275146, -0.595008373260498, -0.5751259922981262, -0.5552435517311096, -0.5353611707687378, -0.5154787302017212, -0.495596319437027, -0.47571390867233276, -0.45583146810531616, -0.43594905734062195, -0.41606664657592773, -0.3961842358112335, -0.3763018250465393, -0.3564193844795227, -0.3365369737148285, -0.3166545629501343, -0.2967721223831177, -0.27688971161842346, -0.25700730085372925, -0.23712489008903503, -0.21724246442317963, -0.19736003875732422, -0.17747762799263, -0.1575952172279358, -0.13771279156208038, -0.11783036589622498, -0.09794789552688599, -0.07806547731161118, -0.058183059096336365, -0.038300640881061554, -0.018418222665786743, 0.0014641955494880676, 0.02134661376476288, 0.041229039430618286, 0.0611114501953125, 0.08099386841058731, 0.10087628662586212, 0.12075870484113693, 0.14064112305641174, 0.16052353382110596, 0.18040595948696136, 0.20028838515281677, 0.220170795917511, 0.2400532066822052, 0.2599356174468994, 0.279818058013916, 0.29970046877861023, 0.31958287954330444, 0.33946532011032104, 0.35934773087501526, 0.3792301416397095, 0.3991125524044037, 0.4189949631690979, 0.4388774037361145, 0.4587598145008087, 0.47864222526550293, 0.49852466583251953, 0.5184071063995361, 0.538289487361908]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 10.0, 6.0, 13.0, 17.0, 23.0, 17.0, 23.0, 16.0, 30.0, 26.0, 34.0, 52.0, 33.0, 29.0, 37.0, 32.0, 61.0, 32.0, 38.0, 54.0, 46.0, 37.0, 36.0, 31.0, 34.0, 41.0, 36.0, 21.0, 24.0, 20.0, 22.0, 13.0, 14.0, 9.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3390185832977295, -0.32841241359710693, -0.317806214094162, -0.30720004439353943, -0.29659387469291687, -0.2859877049922943, -0.27538150548934937, -0.2647753357887268, -0.25416916608810425, -0.2435629814863205, -0.23295681178569794, -0.22235062718391418, -0.21174445748329163, -0.20113827288150787, -0.19053208827972412, -0.17992591857910156, -0.1693197339773178, -0.15871354937553406, -0.1481073796749115, -0.13750119507312775, -0.1268950253725052, -0.11628884077072144, -0.10568266361951828, -0.09507648646831512, -0.08447030931711197, -0.07386413216590881, -0.06325795501470566, -0.052651774138212204, -0.04204559698700905, -0.03143941983580589, -0.02083323895931244, -0.010227061808109283, 0.00037911534309387207, 0.010985293425619602, 0.021591471508145332, 0.03219765052199364, 0.04280382767319679, 0.05341000482439995, 0.0640161857008934, 0.07462236285209656, 0.08522854000329971, 0.09583471715450287, 0.10644089430570602, 0.11704707145690918, 0.12765325605869293, 0.1382594257593155, 0.14886561036109924, 0.1594717800617218, 0.17007796466350555, 0.1806841492652893, 0.19129031896591187, 0.20189650356769562, 0.21250267326831818, 0.22310885787010193, 0.2337150275707245, 0.24432121217250824, 0.254927396774292, 0.26553356647491455, 0.2761397659778595, 0.28674593567848206, 0.2973521053791046, 0.3079582750797272, 0.3185644745826721, 0.3291706442832947, 0.33977681398391724]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 23.0, 55.0, 128.0, 347.0, 1009.0, 2957.0, 9645.0, 47167.0, 676926.0, 277919.0, 23222.0, 6088.0, 1929.0, 690.0, 252.0, 97.0, 39.0, 17.0, 8.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26488494873046875, -0.2546234130859375, -0.24436187744140625, -0.234100341796875, -0.22383880615234375, -0.2135772705078125, -0.20331573486328125, -0.19305419921875, -0.18279266357421875, -0.1725311279296875, -0.16226959228515625, -0.152008056640625, -0.14174652099609375, -0.1314849853515625, -0.12122344970703125, -0.1109619140625, -0.10070037841796875, -0.0904388427734375, -0.08017730712890625, -0.069915771484375, -0.05965423583984375, -0.0493927001953125, -0.03913116455078125, -0.02886962890625, -0.01860809326171875, -0.0083465576171875, 0.00191497802734375, 0.012176513671875, 0.02243804931640625, 0.0326995849609375, 0.04296112060546875, 0.05322265625, 0.06348419189453125, 0.0737457275390625, 0.08400726318359375, 0.094268798828125, 0.10453033447265625, 0.1147918701171875, 0.12505340576171875, 0.13531494140625, 0.14557647705078125, 0.1558380126953125, 0.16609954833984375, 0.176361083984375, 0.18662261962890625, 0.1968841552734375, 0.20714569091796875, 0.2174072265625, 0.22766876220703125, 0.2379302978515625, 0.24819183349609375, 0.258453369140625, 0.26871490478515625, 0.2789764404296875, 0.28923797607421875, 0.29949951171875, 0.30976104736328125, 0.3200225830078125, 0.33028411865234375, 0.340545654296875, 0.35080718994140625, 0.3610687255859375, 0.37133026123046875, 0.381591796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 11.0, 16.0, 17.0, 23.0, 38.0, 29.0, 36.0, 48.0, 48.0, 56.0, 63.0, 68.0, 52.0, 54.0, 64.0, 53.0, 60.0, 42.0, 35.0, 43.0, 32.0, 26.0, 24.0, 13.0, 8.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2235107421875, -0.2151012420654297, -0.20669174194335938, -0.19828224182128906, -0.18987274169921875, -0.18146324157714844, -0.17305374145507812, -0.1646442413330078, -0.1562347412109375, -0.1478252410888672, -0.13941574096679688, -0.13100624084472656, -0.12259674072265625, -0.11418724060058594, -0.10577774047851562, -0.09736824035644531, -0.088958740234375, -0.08054924011230469, -0.07213973999023438, -0.06373023986816406, -0.05532073974609375, -0.04691123962402344, -0.038501739501953125, -0.030092239379882812, -0.0216827392578125, -0.013273239135742188, -0.004863739013671875, 0.0035457611083984375, 0.01195526123046875, 0.020364761352539062, 0.028774261474609375, 0.03718376159667969, 0.04559326171875, 0.05400276184082031, 0.062412261962890625, 0.07082176208496094, 0.07923126220703125, 0.08764076232910156, 0.09605026245117188, 0.10445976257324219, 0.1128692626953125, 0.12127876281738281, 0.12968826293945312, 0.13809776306152344, 0.14650726318359375, 0.15491676330566406, 0.16332626342773438, 0.1717357635498047, 0.180145263671875, 0.1885547637939453, 0.19696426391601562, 0.20537376403808594, 0.21378326416015625, 0.22219276428222656, 0.23060226440429688, 0.2390117645263672, 0.2474212646484375, 0.2558307647705078, 0.2642402648925781, 0.27264976501464844, 0.28105926513671875, 0.28946876525878906, 0.2978782653808594, 0.3062877655029297, 0.314697265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 11.0, 11.0, 19.0, 21.0, 38.0, 64.0, 98.0, 118.0, 200.0, 287.0, 457.0, 810.0, 1454.0, 2751.0, 5380.0, 11867.0, 29624.0, 88168.0, 262994.0, 377993.0, 173585.0, 55176.0, 19994.0, 8305.0, 4020.0, 2110.0, 1195.0, 689.0, 399.0, 247.0, 162.0, 93.0, 76.0, 43.0, 36.0, 15.0, 20.0, 7.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0823974609375, -0.07967758178710938, -0.07695770263671875, -0.07423782348632812, -0.0715179443359375, -0.06879806518554688, -0.06607818603515625, -0.06335830688476562, -0.060638427734375, -0.057918548583984375, -0.05519866943359375, -0.052478790283203125, -0.0497589111328125, -0.047039031982421875, -0.04431915283203125, -0.041599273681640625, -0.03887939453125, -0.036159515380859375, -0.03343963623046875, -0.030719757080078125, -0.0279998779296875, -0.025279998779296875, -0.02256011962890625, -0.019840240478515625, -0.017120361328125, -0.014400482177734375, -0.01168060302734375, -0.008960723876953125, -0.0062408447265625, -0.003520965576171875, -0.00080108642578125, 0.001918792724609375, 0.004638671875, 0.007358551025390625, 0.01007843017578125, 0.012798309326171875, 0.0155181884765625, 0.018238067626953125, 0.02095794677734375, 0.023677825927734375, 0.026397705078125, 0.029117584228515625, 0.03183746337890625, 0.034557342529296875, 0.0372772216796875, 0.039997100830078125, 0.04271697998046875, 0.045436859130859375, 0.04815673828125, 0.050876617431640625, 0.05359649658203125, 0.056316375732421875, 0.0590362548828125, 0.061756134033203125, 0.06447601318359375, 0.06719589233398438, 0.069915771484375, 0.07263565063476562, 0.07535552978515625, 0.07807540893554688, 0.0807952880859375, 0.08351516723632812, 0.08623504638671875, 0.08895492553710938, 0.0916748046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 7.0, 11.0, 14.0, 13.0, 24.0, 19.0, 25.0, 31.0, 31.0, 29.0, 25.0, 31.0, 26.0, 39.0, 44.0, 43.0, 45.0, 44.0, 38.0, 29.0, 33.0, 36.0, 30.0, 36.0, 31.0, 26.0, 32.0, 12.0, 23.0, 20.0, 29.0, 18.0, 11.0, 13.0, 5.0, 4.0, 10.0, 5.0, 6.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-0.3837890625, -0.3726043701171875, -0.361419677734375, -0.3502349853515625, -0.33905029296875, -0.3278656005859375, -0.316680908203125, -0.3054962158203125, -0.2943115234375, -0.2831268310546875, -0.271942138671875, -0.2607574462890625, -0.24957275390625, -0.2383880615234375, -0.227203369140625, -0.2160186767578125, -0.204833984375, -0.1936492919921875, -0.182464599609375, -0.1712799072265625, -0.16009521484375, -0.1489105224609375, -0.137725830078125, -0.1265411376953125, -0.1153564453125, -0.1041717529296875, -0.092987060546875, -0.0818023681640625, -0.07061767578125, -0.0594329833984375, -0.048248291015625, -0.0370635986328125, -0.02587890625, -0.0146942138671875, -0.003509521484375, 0.0076751708984375, 0.01885986328125, 0.0300445556640625, 0.041229248046875, 0.0524139404296875, 0.0635986328125, 0.0747833251953125, 0.085968017578125, 0.0971527099609375, 0.10833740234375, 0.1195220947265625, 0.130706787109375, 0.1418914794921875, 0.153076171875, 0.1642608642578125, 0.175445556640625, 0.1866302490234375, 0.19781494140625, 0.2089996337890625, 0.220184326171875, 0.2313690185546875, 0.2425537109375, 0.2537384033203125, 0.264923095703125, 0.2761077880859375, 0.28729248046875, 0.2984771728515625, 0.309661865234375, 0.3208465576171875, 0.33203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 8.0, 10.0, 15.0, 21.0, 44.0, 55.0, 82.0, 122.0, 190.0, 299.0, 549.0, 999.0, 2309.0, 5566.0, 17916.0, 78059.0, 369690.0, 436534.0, 102203.0, 22008.0, 6732.0, 2527.0, 1104.0, 638.0, 328.0, 171.0, 111.0, 77.0, 55.0, 36.0, 17.0, 11.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 10.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.044830322265625, -0.04347515106201172, -0.04211997985839844, -0.040764808654785156, -0.039409637451171875, -0.038054466247558594, -0.03669929504394531, -0.03534412384033203, -0.03398895263671875, -0.03263378143310547, -0.03127861022949219, -0.029923439025878906, -0.028568267822265625, -0.027213096618652344, -0.025857925415039062, -0.02450275421142578, -0.0231475830078125, -0.02179241180419922, -0.020437240600585938, -0.019082069396972656, -0.017726898193359375, -0.016371726989746094, -0.015016555786132812, -0.013661384582519531, -0.01230621337890625, -0.010951042175292969, -0.009595870971679688, -0.008240699768066406, -0.006885528564453125, -0.005530357360839844, -0.0041751861572265625, -0.0028200149536132812, -0.00146484375, -0.00010967254638671875, 0.0012454986572265625, 0.0026006698608398438, 0.003955841064453125, 0.005311012268066406, 0.0066661834716796875, 0.008021354675292969, 0.00937652587890625, 0.010731697082519531, 0.012086868286132812, 0.013442039489746094, 0.014797210693359375, 0.016152381896972656, 0.017507553100585938, 0.01886272430419922, 0.0202178955078125, 0.02157306671142578, 0.022928237915039062, 0.024283409118652344, 0.025638580322265625, 0.026993751525878906, 0.028348922729492188, 0.02970409393310547, 0.03105926513671875, 0.03241443634033203, 0.03376960754394531, 0.035124778747558594, 0.036479949951171875, 0.037835121154785156, 0.03919029235839844, 0.04054546356201172, 0.041900634765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 2.0, 7.0, 7.0, 4.0, 8.0, 22.0, 29.0, 39.0, 35.0, 48.0, 49.0, 76.0, 83.0, 101.0, 69.0, 88.0, 62.0, 64.0, 58.0, 35.0, 21.0, 25.0, 14.0, 9.0, 14.0, 6.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.6460195183753967e-05, -1.5873461961746216e-05, -1.5286728739738464e-05, -1.4699995517730713e-05, -1.4113262295722961e-05, -1.352652907371521e-05, -1.2939795851707458e-05, -1.2353062629699707e-05, -1.1766329407691956e-05, -1.1179596185684204e-05, -1.0592862963676453e-05, -1.0006129741668701e-05, -9.41939651966095e-06, -8.832663297653198e-06, -8.245930075645447e-06, -7.659196853637695e-06, -7.072463631629944e-06, -6.485730409622192e-06, -5.898997187614441e-06, -5.3122639656066895e-06, -4.725530743598938e-06, -4.1387975215911865e-06, -3.552064299583435e-06, -2.9653310775756836e-06, -2.378597855567932e-06, -1.7918646335601807e-06, -1.2051314115524292e-06, -6.183981895446777e-07, -3.166496753692627e-08, 5.550682544708252e-07, 1.1418014764785767e-06, 1.7285346984863281e-06, 2.3152679204940796e-06, 2.902001142501831e-06, 3.4887343645095825e-06, 4.075467586517334e-06, 4.6622008085250854e-06, 5.248934030532837e-06, 5.835667252540588e-06, 6.42240047454834e-06, 7.009133696556091e-06, 7.595866918563843e-06, 8.182600140571594e-06, 8.769333362579346e-06, 9.356066584587097e-06, 9.942799806594849e-06, 1.05295330286026e-05, 1.1116266250610352e-05, 1.1702999472618103e-05, 1.2289732694625854e-05, 1.2876465916633606e-05, 1.3463199138641357e-05, 1.4049932360649109e-05, 1.463666558265686e-05, 1.5223398804664612e-05, 1.5810132026672363e-05, 1.6396865248680115e-05, 1.6983598470687866e-05, 1.7570331692695618e-05, 1.815706491470337e-05, 1.874379813671112e-05, 1.9330531358718872e-05, 1.9917264580726624e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 11.0, 2.0, 13.0, 8.0, 25.0, 25.0, 50.0, 96.0, 173.0, 337.0, 866.0, 2598.0, 9546.0, 46565.0, 263821.0, 542250.0, 146783.0, 26511.0, 5916.0, 1659.0, 664.0, 282.0, 126.0, 75.0, 42.0, 47.0, 14.0, 14.0, 10.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054779052734375, -0.05291128158569336, -0.05104351043701172, -0.04917573928833008, -0.04730796813964844, -0.0454401969909668, -0.043572425842285156, -0.041704654693603516, -0.039836883544921875, -0.037969112396240234, -0.036101341247558594, -0.03423357009887695, -0.03236579895019531, -0.030498027801513672, -0.02863025665283203, -0.02676248550415039, -0.02489471435546875, -0.02302694320678711, -0.02115917205810547, -0.019291400909423828, -0.017423629760742188, -0.015555858612060547, -0.013688087463378906, -0.011820316314697266, -0.009952545166015625, -0.008084774017333984, -0.006217002868652344, -0.004349231719970703, -0.0024814605712890625, -0.0006136894226074219, 0.0012540817260742188, 0.0031218528747558594, 0.0049896240234375, 0.006857395172119141, 0.008725166320800781, 0.010592937469482422, 0.012460708618164062, 0.014328479766845703, 0.016196250915527344, 0.018064022064208984, 0.019931793212890625, 0.021799564361572266, 0.023667335510253906, 0.025535106658935547, 0.027402877807617188, 0.029270648956298828, 0.03113842010498047, 0.03300619125366211, 0.03487396240234375, 0.03674173355102539, 0.03860950469970703, 0.04047727584838867, 0.04234504699707031, 0.04421281814575195, 0.046080589294433594, 0.047948360443115234, 0.049816131591796875, 0.051683902740478516, 0.053551673889160156, 0.0554194450378418, 0.05728721618652344, 0.05915498733520508, 0.06102275848388672, 0.06289052963256836, 0.06475830078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 14.0, 12.0, 19.0, 34.0, 37.0, 54.0, 78.0, 96.0, 112.0, 120.0, 120.0, 79.0, 67.0, 52.0, 34.0, 18.0, 18.0, 11.0, 9.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.018646240234375, -0.018119215965270996, -0.017592191696166992, -0.01706516742706299, -0.016538143157958984, -0.01601111888885498, -0.015484094619750977, -0.014957070350646973, -0.014430046081542969, -0.013903021812438965, -0.013375997543334961, -0.012848973274230957, -0.012321949005126953, -0.01179492473602295, -0.011267900466918945, -0.010740876197814941, -0.010213851928710938, -0.009686827659606934, -0.00915980339050293, -0.008632779121398926, -0.008105754852294922, -0.007578730583190918, -0.007051706314086914, -0.00652468204498291, -0.005997657775878906, -0.005470633506774902, -0.0049436092376708984, -0.0044165849685668945, -0.0038895606994628906, -0.0033625364303588867, -0.002835512161254883, -0.002308487892150879, -0.001781463623046875, -0.001254439353942871, -0.0007274150848388672, -0.00020039081573486328, 0.0003266334533691406, 0.0008536577224731445, 0.0013806819915771484, 0.0019077062606811523, 0.0024347305297851562, 0.00296175479888916, 0.003488779067993164, 0.004015803337097168, 0.004542827606201172, 0.005069851875305176, 0.00559687614440918, 0.006123900413513184, 0.0066509246826171875, 0.007177948951721191, 0.007704973220825195, 0.0082319974899292, 0.008759021759033203, 0.009286046028137207, 0.009813070297241211, 0.010340094566345215, 0.010867118835449219, 0.011394143104553223, 0.011921167373657227, 0.01244819164276123, 0.012975215911865234, 0.013502240180969238, 0.014029264450073242, 0.014556288719177246, 0.01508331298828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 12.0, 17.0, 23.0, 28.0, 46.0, 78.0, 114.0, 122.0, 114.0, 121.0, 95.0, 80.0, 53.0, 47.0, 18.0, 16.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4926278293132782, -0.4795452356338501, -0.4664626121520996, -0.4533800184726715, -0.4402974247932434, -0.4272148013114929, -0.4141322076320648, -0.4010496139526367, -0.3879670202732086, -0.3748844265937805, -0.36180180311203003, -0.34871920943260193, -0.33563661575317383, -0.32255399227142334, -0.30947139859199524, -0.29638880491256714, -0.28330618143081665, -0.27022358775138855, -0.25714096426963806, -0.24405837059020996, -0.23097577691078186, -0.21789316833019257, -0.20481055974960327, -0.19172796607017517, -0.17864537239074707, -0.16556276381015778, -0.15248017013072968, -0.13939756155014038, -0.12631496787071228, -0.11323235929012299, -0.10014975816011429, -0.08706715703010559, -0.07398456335067749, -0.06090196222066879, -0.047819361090660095, -0.0347367562353611, -0.0216541551053524, -0.008571550250053406, 0.004511050879955292, 0.01759365200996399, 0.030676253139972687, 0.043758854269981384, 0.05684145539999008, 0.06992405652999878, 0.08300666511058807, 0.09608926624059677, 0.10917186737060547, 0.12225446850061417, 0.13533706963062286, 0.14841967821121216, 0.16150227189064026, 0.17458488047122955, 0.18766747415065765, 0.20075008273124695, 0.21383267641067505, 0.22691528499126434, 0.23999789357185364, 0.25308048725128174, 0.2661631107330322, 0.2792457044124603, 0.2923282980918884, 0.3054109215736389, 0.318493515253067, 0.3315761089324951, 0.3446587026119232]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 0.0, 7.0, 6.0, 9.0, 12.0, 16.0, 16.0, 28.0, 30.0, 33.0, 28.0, 41.0, 48.0, 49.0, 38.0, 51.0, 51.0, 48.0, 51.0, 51.0, 46.0, 48.0, 39.0, 46.0, 35.0, 37.0, 33.0, 20.0, 22.0, 18.0, 10.0, 6.0, 15.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1983073204755783, -0.19137267768383026, -0.18443803489208221, -0.17750339210033417, -0.17056876420974731, -0.16363412141799927, -0.15669947862625122, -0.14976483583450317, -0.14283019304275513, -0.13589555025100708, -0.12896090745925903, -0.12202627211809158, -0.11509162932634354, -0.10815698653459549, -0.10122235119342804, -0.09428770840167999, -0.08735306560993195, -0.0804184228181839, -0.07348378002643585, -0.0665491446852684, -0.059614501893520355, -0.05267985910177231, -0.04574522003531456, -0.03881058096885681, -0.031875938177108765, -0.024941297248005867, -0.01800665631890297, -0.011072015389800072, -0.004137374460697174, 0.002797268331050873, 0.009731907397508621, 0.01666654646396637, 0.023601189255714417, 0.030535830184817314, 0.03747047111392021, 0.04440511018037796, 0.05133975297212601, 0.058274395763874054, 0.0652090311050415, 0.07214367389678955, 0.0790783166885376, 0.08601295948028564, 0.09294760227203369, 0.09988223761320114, 0.10681688040494919, 0.11375152319669724, 0.12068615853786469, 0.12762080132961273, 0.13455544412136078, 0.14149008691310883, 0.14842472970485687, 0.15535937249660492, 0.16229400038719177, 0.16922864317893982, 0.17616328597068787, 0.1830979287624359, 0.19003257155418396, 0.196967214345932, 0.20390185713768005, 0.2108364999294281, 0.21777114272117615, 0.2247057855129242, 0.23164041340351105, 0.2385750561952591, 0.24550969898700714]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 15.0, 20.0, 45.0, 76.0, 141.0, 302.0, 610.0, 1434.0, 3645.0, 10822.0, 35801.0, 152449.0, 578759.0, 200497.0, 43706.0, 13002.0, 4270.0, 1563.0, 680.0, 321.0, 154.0, 83.0, 64.0, 32.0, 14.0, 14.0, 8.0, 8.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.32045745849609375, -0.3074188232421875, -0.29438018798828125, -0.281341552734375, -0.26830291748046875, -0.2552642822265625, -0.24222564697265625, -0.22918701171875, -0.21614837646484375, -0.2031097412109375, -0.19007110595703125, -0.177032470703125, -0.16399383544921875, -0.1509552001953125, -0.13791656494140625, -0.1248779296875, -0.11183929443359375, -0.0988006591796875, -0.08576202392578125, -0.072723388671875, -0.05968475341796875, -0.0466461181640625, -0.03360748291015625, -0.02056884765625, -0.00753021240234375, 0.0055084228515625, 0.01854705810546875, 0.031585693359375, 0.04462432861328125, 0.0576629638671875, 0.07070159912109375, 0.083740234375, 0.09677886962890625, 0.1098175048828125, 0.12285614013671875, 0.135894775390625, 0.14893341064453125, 0.1619720458984375, 0.17501068115234375, 0.18804931640625, 0.20108795166015625, 0.2141265869140625, 0.22716522216796875, 0.240203857421875, 0.25324249267578125, 0.2662811279296875, 0.27931976318359375, 0.2923583984375, 0.30539703369140625, 0.3184356689453125, 0.33147430419921875, 0.344512939453125, 0.35755157470703125, 0.3705902099609375, 0.38362884521484375, 0.39666748046875, 0.40970611572265625, 0.4227447509765625, 0.43578338623046875, 0.448822021484375, 0.46186065673828125, 0.4748992919921875, 0.48793792724609375, 0.5009765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 12.0, 12.0, 8.0, 17.0, 20.0, 22.0, 26.0, 42.0, 33.0, 37.0, 39.0, 43.0, 44.0, 42.0, 50.0, 50.0, 36.0, 44.0, 42.0, 41.0, 42.0, 47.0, 42.0, 22.0, 29.0, 30.0, 20.0, 19.0, 16.0, 17.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382568359375, -0.37010955810546875, -0.3576507568359375, -0.34519195556640625, -0.332733154296875, -0.32027435302734375, -0.3078155517578125, -0.29535675048828125, -0.28289794921875, -0.27043914794921875, -0.2579803466796875, -0.24552154541015625, -0.233062744140625, -0.22060394287109375, -0.2081451416015625, -0.19568634033203125, -0.1832275390625, -0.17076873779296875, -0.1583099365234375, -0.14585113525390625, -0.133392333984375, -0.12093353271484375, -0.1084747314453125, -0.09601593017578125, -0.08355712890625, -0.07109832763671875, -0.0586395263671875, -0.04618072509765625, -0.033721923828125, -0.02126312255859375, -0.0088043212890625, 0.00365447998046875, 0.01611328125, 0.02857208251953125, 0.0410308837890625, 0.05348968505859375, 0.065948486328125, 0.07840728759765625, 0.0908660888671875, 0.10332489013671875, 0.11578369140625, 0.12824249267578125, 0.1407012939453125, 0.15316009521484375, 0.165618896484375, 0.17807769775390625, 0.1905364990234375, 0.20299530029296875, 0.2154541015625, 0.22791290283203125, 0.2403717041015625, 0.25283050537109375, 0.265289306640625, 0.27774810791015625, 0.2902069091796875, 0.30266571044921875, 0.31512451171875, 0.32758331298828125, 0.3400421142578125, 0.35250091552734375, 0.364959716796875, 0.37741851806640625, 0.3898773193359375, 0.40233612060546875, 0.414794921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 22.0, 34.0, 33.0, 54.0, 94.0, 124.0, 244.0, 613.0, 1549.0, 5899.0, 27802.0, 199342.0, 686716.0, 102964.0, 16937.0, 3856.0, 1154.0, 448.0, 217.0, 122.0, 102.0, 61.0, 22.0, 27.0, 27.0, 16.0, 7.0, 5.0, 2.0, 5.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.59033203125, -0.5740928649902344, -0.5578536987304688, -0.5416145324707031, -0.5253753662109375, -0.5091361999511719, -0.49289703369140625, -0.4766578674316406, -0.460418701171875, -0.4441795349121094, -0.42794036865234375, -0.4117012023925781, -0.3954620361328125, -0.3792228698730469, -0.36298370361328125, -0.3467445373535156, -0.33050537109375, -0.3142662048339844, -0.29802703857421875, -0.2817878723144531, -0.2655487060546875, -0.24930953979492188, -0.23307037353515625, -0.21683120727539062, -0.200592041015625, -0.18435287475585938, -0.16811370849609375, -0.15187454223632812, -0.1356353759765625, -0.11939620971679688, -0.10315704345703125, -0.08691787719726562, -0.0706787109375, -0.054439544677734375, -0.03820037841796875, -0.021961212158203125, -0.0057220458984375, 0.010517120361328125, 0.02675628662109375, 0.042995452880859375, 0.059234619140625, 0.07547378540039062, 0.09171295166015625, 0.10795211791992188, 0.1241912841796875, 0.14043045043945312, 0.15666961669921875, 0.17290878295898438, 0.18914794921875, 0.20538711547851562, 0.22162628173828125, 0.23786544799804688, 0.2541046142578125, 0.2703437805175781, 0.28658294677734375, 0.3028221130371094, 0.319061279296875, 0.3353004455566406, 0.35153961181640625, 0.3677787780761719, 0.3840179443359375, 0.4002571105957031, 0.41649627685546875, 0.4327354431152344, 0.448974609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 7.0, 4.0, 11.0, 16.0, 13.0, 19.0, 14.0, 29.0, 23.0, 32.0, 26.0, 41.0, 47.0, 60.0, 37.0, 51.0, 50.0, 60.0, 50.0, 52.0, 53.0, 45.0, 36.0, 34.0, 27.0, 25.0, 17.0, 15.0, 17.0, 11.0, 6.0, 8.0, 10.0, 9.0, 6.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3644981384277344, -0.34984588623046875, -0.3351936340332031, -0.3205413818359375, -0.3058891296386719, -0.29123687744140625, -0.2765846252441406, -0.261932373046875, -0.24728012084960938, -0.23262786865234375, -0.21797561645507812, -0.2033233642578125, -0.18867111206054688, -0.17401885986328125, -0.15936660766601562, -0.14471435546875, -0.13006210327148438, -0.11540985107421875, -0.10075759887695312, -0.0861053466796875, -0.07145309448242188, -0.05680084228515625, -0.042148590087890625, -0.027496337890625, -0.012844085693359375, 0.00180816650390625, 0.016460418701171875, 0.0311126708984375, 0.045764923095703125, 0.06041717529296875, 0.07506942749023438, 0.0897216796875, 0.10437393188476562, 0.11902618408203125, 0.13367843627929688, 0.1483306884765625, 0.16298294067382812, 0.17763519287109375, 0.19228744506835938, 0.206939697265625, 0.22159194946289062, 0.23624420166015625, 0.2508964538574219, 0.2655487060546875, 0.2802009582519531, 0.29485321044921875, 0.3095054626464844, 0.32415771484375, 0.3388099670410156, 0.35346221923828125, 0.3681144714355469, 0.3827667236328125, 0.3974189758300781, 0.41207122802734375, 0.4267234802246094, 0.441375732421875, 0.4560279846191406, 0.47068023681640625, 0.4853324890136719, 0.4999847412109375, 0.5146369934082031, 0.5292892456054688, 0.5439414978027344, 0.55859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 17.0, 12.0, 25.0, 53.0, 58.0, 133.0, 241.0, 524.0, 964.0, 2354.0, 6284.0, 21392.0, 113168.0, 608244.0, 240634.0, 38467.0, 9925.0, 3301.0, 1393.0, 619.0, 333.0, 155.0, 78.0, 49.0, 32.0, 19.0, 13.0, 15.0, 11.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.128662109375, -0.12484359741210938, -0.12102508544921875, -0.11720657348632812, -0.1133880615234375, -0.10956954956054688, -0.10575103759765625, -0.10193252563476562, -0.098114013671875, -0.09429550170898438, -0.09047698974609375, -0.08665847778320312, -0.0828399658203125, -0.07902145385742188, -0.07520294189453125, -0.07138442993164062, -0.06756591796875, -0.06374740600585938, -0.05992889404296875, -0.056110382080078125, -0.0522918701171875, -0.048473358154296875, -0.04465484619140625, -0.040836334228515625, -0.037017822265625, -0.033199310302734375, -0.02938079833984375, -0.025562286376953125, -0.0217437744140625, -0.017925262451171875, -0.01410675048828125, -0.010288238525390625, -0.0064697265625, -0.002651214599609375, 0.00116729736328125, 0.004985809326171875, 0.0088043212890625, 0.012622833251953125, 0.01644134521484375, 0.020259857177734375, 0.024078369140625, 0.027896881103515625, 0.03171539306640625, 0.035533905029296875, 0.0393524169921875, 0.043170928955078125, 0.04698944091796875, 0.050807952880859375, 0.05462646484375, 0.058444976806640625, 0.06226348876953125, 0.06608200073242188, 0.0699005126953125, 0.07371902465820312, 0.07753753662109375, 0.08135604858398438, 0.085174560546875, 0.08899307250976562, 0.09281158447265625, 0.09663009643554688, 0.1004486083984375, 0.10426712036132812, 0.10808563232421875, 0.11190414428710938, 0.11572265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 9.0, 12.0, 8.0, 15.0, 25.0, 21.0, 42.0, 47.0, 81.0, 92.0, 149.0, 134.0, 106.0, 85.0, 49.0, 43.0, 30.0, 24.0, 11.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.676248550415039e-05, -2.5925226509571075e-05, -2.508796751499176e-05, -2.4250708520412445e-05, -2.341344952583313e-05, -2.2576190531253815e-05, -2.17389315366745e-05, -2.0901672542095184e-05, -2.006441354751587e-05, -1.9227154552936554e-05, -1.838989555835724e-05, -1.7552636563777924e-05, -1.671537756919861e-05, -1.5878118574619293e-05, -1.5040859580039978e-05, -1.4203600585460663e-05, -1.3366341590881348e-05, -1.2529082596302032e-05, -1.1691823601722717e-05, -1.0854564607143402e-05, -1.0017305612564087e-05, -9.180046617984772e-06, -8.342787623405457e-06, -7.505528628826141e-06, -6.668269634246826e-06, -5.831010639667511e-06, -4.993751645088196e-06, -4.156492650508881e-06, -3.3192336559295654e-06, -2.4819746613502502e-06, -1.644715666770935e-06, -8.074566721916199e-07, 2.9802322387695312e-08, 8.670613169670105e-07, 1.7043203115463257e-06, 2.541579306125641e-06, 3.378838300704956e-06, 4.216097295284271e-06, 5.0533562898635864e-06, 5.890615284442902e-06, 6.727874279022217e-06, 7.565133273601532e-06, 8.402392268180847e-06, 9.239651262760162e-06, 1.0076910257339478e-05, 1.0914169251918793e-05, 1.1751428246498108e-05, 1.2588687241077423e-05, 1.3425946235656738e-05, 1.4263205230236053e-05, 1.5100464224815369e-05, 1.5937723219394684e-05, 1.6774982213974e-05, 1.7612241208553314e-05, 1.844950020313263e-05, 1.9286759197711945e-05, 2.012401819229126e-05, 2.0961277186870575e-05, 2.179853618144989e-05, 2.2635795176029205e-05, 2.347305417060852e-05, 2.4310313165187836e-05, 2.514757215976715e-05, 2.5984831154346466e-05, 2.682209014892578e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 11.0, 15.0, 16.0, 33.0, 44.0, 101.0, 145.0, 305.0, 639.0, 1399.0, 3277.0, 9970.0, 43700.0, 353148.0, 544833.0, 69956.0, 13450.0, 4237.0, 1661.0, 756.0, 371.0, 205.0, 96.0, 66.0, 37.0, 20.0, 12.0, 9.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.181884765625, -0.176849365234375, -0.17181396484375, -0.166778564453125, -0.1617431640625, -0.156707763671875, -0.15167236328125, -0.146636962890625, -0.1416015625, -0.136566162109375, -0.13153076171875, -0.126495361328125, -0.1214599609375, -0.116424560546875, -0.11138916015625, -0.106353759765625, -0.101318359375, -0.096282958984375, -0.09124755859375, -0.086212158203125, -0.0811767578125, -0.076141357421875, -0.07110595703125, -0.066070556640625, -0.06103515625, -0.055999755859375, -0.05096435546875, -0.045928955078125, -0.0408935546875, -0.035858154296875, -0.03082275390625, -0.025787353515625, -0.020751953125, -0.015716552734375, -0.01068115234375, -0.005645751953125, -0.0006103515625, 0.004425048828125, 0.00946044921875, 0.014495849609375, 0.01953125, 0.024566650390625, 0.02960205078125, 0.034637451171875, 0.0396728515625, 0.044708251953125, 0.04974365234375, 0.054779052734375, 0.059814453125, 0.064849853515625, 0.06988525390625, 0.074920654296875, 0.0799560546875, 0.084991455078125, 0.09002685546875, 0.095062255859375, 0.10009765625, 0.105133056640625, 0.11016845703125, 0.115203857421875, 0.1202392578125, 0.125274658203125, 0.13031005859375, 0.135345458984375, 0.140380859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 9.0, 8.0, 10.0, 15.0, 14.0, 24.0, 43.0, 46.0, 54.0, 56.0, 67.0, 93.0, 129.0, 83.0, 72.0, 53.0, 32.0, 36.0, 22.0, 15.0, 19.0, 15.0, 12.0, 14.0, 6.0, 6.0, 10.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037689208984375, -0.035985469818115234, -0.03428173065185547, -0.0325779914855957, -0.030874252319335938, -0.029170513153076172, -0.027466773986816406, -0.02576303482055664, -0.024059295654296875, -0.02235555648803711, -0.020651817321777344, -0.018948078155517578, -0.017244338989257812, -0.015540599822998047, -0.013836860656738281, -0.012133121490478516, -0.01042938232421875, -0.008725643157958984, -0.007021903991699219, -0.005318164825439453, -0.0036144256591796875, -0.0019106864929199219, -0.00020694732666015625, 0.0014967918395996094, 0.003200531005859375, 0.004904270172119141, 0.006608009338378906, 0.008311748504638672, 0.010015487670898438, 0.011719226837158203, 0.013422966003417969, 0.015126705169677734, 0.0168304443359375, 0.018534183502197266, 0.02023792266845703, 0.021941661834716797, 0.023645401000976562, 0.025349140167236328, 0.027052879333496094, 0.02875661849975586, 0.030460357666015625, 0.03216409683227539, 0.033867835998535156, 0.03557157516479492, 0.03727531433105469, 0.03897905349731445, 0.04068279266357422, 0.042386531829833984, 0.04409027099609375, 0.045794010162353516, 0.04749774932861328, 0.04920148849487305, 0.05090522766113281, 0.05260896682739258, 0.054312705993652344, 0.05601644515991211, 0.057720184326171875, 0.05942392349243164, 0.061127662658691406, 0.06283140182495117, 0.06453514099121094, 0.0662388801574707, 0.06794261932373047, 0.06964635848999023, 0.07135009765625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 12.0, 31.0, 94.0, 153.0, 255.0, 230.0, 138.0, 64.0, 22.0, 11.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5363852977752686, -0.4763522744178772, -0.41631922125816345, -0.3562861979007721, -0.29625314474105835, -0.236220121383667, -0.17618709802627563, -0.11615404486656189, -0.05612102150917053, 0.003912013024091721, 0.06394504755735397, 0.12397807836532593, 0.18401111662387848, 0.24404415488243103, 0.3040771782398224, 0.36411023139953613, 0.4241432547569275, 0.48417627811431885, 0.5442093014717102, 0.6042423248291016, 0.6642754077911377, 0.724308431148529, 0.7843414545059204, 0.8443745374679565, 0.9044075012207031, 0.9644405245780945, 1.0244735479354858, 1.084506630897522, 1.1445395946502686, 1.2045726776123047, 1.2646057605743408, 1.3246387243270874, 1.3846718072891235, 1.4447048902511597, 1.5047378540039062, 1.5647709369659424, 1.624803900718689, 1.684836983680725, 1.7448699474334717, 1.8049030303955078, 1.864936113357544, 1.92496919631958, 1.9850021600723267, 2.0450351238250732, 2.1050682067871094, 2.1651012897491455, 2.2251343727111816, 2.2851674556732178, 2.345200300216675, 2.405233383178711, 2.465266466140747, 2.525299310684204, 2.5853323936462402, 2.6453654766082764, 2.7053985595703125, 2.7654316425323486, 2.8254647254943848, 2.885497808456421, 2.945530891418457, 3.005563735961914, 3.06559681892395, 3.1256299018859863, 3.1856629848480225, 3.2456960678100586, 3.3057289123535156]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 0.0, 3.0, 6.0, 6.0, 8.0, 5.0, 6.0, 5.0, 7.0, 10.0, 15.0, 16.0, 23.0, 21.0, 37.0, 41.0, 37.0, 28.0, 40.0, 31.0, 37.0, 47.0, 42.0, 38.0, 36.0, 31.0, 39.0, 40.0, 33.0, 33.0, 35.0, 33.0, 33.0, 31.0, 17.0, 21.0, 17.0, 18.0, 18.0, 11.0, 19.0, 6.0, 12.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7475723028182983, -0.7260862588882446, -0.7046001553535461, -0.6831140518188477, -0.661628007888794, -0.6401419639587402, -0.6186558604240417, -0.5971697568893433, -0.5756837129592896, -0.5541976690292358, -0.5327115654945374, -0.5112254619598389, -0.48973941802978516, -0.46825334429740906, -0.44676727056503296, -0.42528119683265686, -0.40379512310028076, -0.38230904936790466, -0.36082297563552856, -0.33933690190315247, -0.31785082817077637, -0.29636475443840027, -0.27487868070602417, -0.25339260697364807, -0.23190653324127197, -0.21042045950889587, -0.18893438577651978, -0.16744831204414368, -0.14596223831176758, -0.12447616457939148, -0.10299009084701538, -0.08150401711463928, -0.06001788377761841, -0.03853181004524231, -0.01704573631286621, 0.004440337419509888, 0.025926411151885986, 0.047412484884262085, 0.06889855861663818, 0.09038463234901428, 0.11187070608139038, 0.13335677981376648, 0.15484285354614258, 0.17632892727851868, 0.19781500101089478, 0.21930107474327087, 0.24078714847564697, 0.26227322220802307, 0.28375929594039917, 0.30524536967277527, 0.32673144340515137, 0.34821751713752747, 0.36970359086990356, 0.39118966460227966, 0.41267573833465576, 0.43416181206703186, 0.45564788579940796, 0.47713395953178406, 0.49862003326416016, 0.5201060771942139, 0.5415921807289124, 0.5630782842636108, 0.5845643281936646, 0.6060503721237183, 0.6275364756584167]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 12.0, 13.0, 11.0, 18.0, 28.0, 29.0, 42.0, 70.0, 107.0, 185.0, 428.0, 1104.0, 3181.0, 12363.0, 79582.0, 1215886.0, 2620087.0, 227272.0, 25352.0, 5595.0, 1673.0, 595.0, 245.0, 134.0, 66.0, 42.0, 33.0, 29.0, 13.0, 23.0, 18.0, 9.0, 8.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.65673828125, -0.6399879455566406, -0.6232376098632812, -0.6064872741699219, -0.5897369384765625, -0.5729866027832031, -0.5562362670898438, -0.5394859313964844, -0.522735595703125, -0.5059852600097656, -0.48923492431640625, -0.4724845886230469, -0.4557342529296875, -0.4389839172363281, -0.42223358154296875, -0.4054832458496094, -0.38873291015625, -0.3719825744628906, -0.35523223876953125, -0.3384819030761719, -0.3217315673828125, -0.3049812316894531, -0.28823089599609375, -0.2714805603027344, -0.254730224609375, -0.23797988891601562, -0.22122955322265625, -0.20447921752929688, -0.1877288818359375, -0.17097854614257812, -0.15422821044921875, -0.13747787475585938, -0.1207275390625, -0.10397720336914062, -0.08722686767578125, -0.07047653198242188, -0.0537261962890625, -0.036975860595703125, -0.02022552490234375, -0.003475189208984375, 0.013275146484375, 0.030025482177734375, 0.04677581787109375, 0.06352615356445312, 0.0802764892578125, 0.09702682495117188, 0.11377716064453125, 0.13052749633789062, 0.14727783203125, 0.16402816772460938, 0.18077850341796875, 0.19752883911132812, 0.2142791748046875, 0.23102951049804688, 0.24777984619140625, 0.2645301818847656, 0.281280517578125, 0.2980308532714844, 0.31478118896484375, 0.3315315246582031, 0.3482818603515625, 0.3650321960449219, 0.38178253173828125, 0.3985328674316406, 0.415283203125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 10.0, 17.0, 19.0, 9.0, 28.0, 21.0, 23.0, 28.0, 46.0, 34.0, 36.0, 41.0, 31.0, 54.0, 40.0, 45.0, 43.0, 33.0, 42.0, 28.0, 46.0, 27.0, 39.0, 34.0, 30.0, 35.0, 16.0, 16.0, 14.0, 16.0, 14.0, 10.0, 10.0, 13.0, 7.0, 6.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.22265625, -0.21603775024414062, -0.20941925048828125, -0.20280075073242188, -0.1961822509765625, -0.18956375122070312, -0.18294525146484375, -0.17632675170898438, -0.169708251953125, -0.16308975219726562, -0.15647125244140625, -0.14985275268554688, -0.1432342529296875, -0.13661575317382812, -0.12999725341796875, -0.12337875366210938, -0.11676025390625, -0.11014175415039062, -0.10352325439453125, -0.09690475463867188, -0.0902862548828125, -0.08366775512695312, -0.07704925537109375, -0.07043075561523438, -0.063812255859375, -0.057193756103515625, -0.05057525634765625, -0.043956756591796875, -0.0373382568359375, -0.030719757080078125, -0.02410125732421875, -0.017482757568359375, -0.0108642578125, -0.004245758056640625, 0.00237274169921875, 0.008991241455078125, 0.0156097412109375, 0.022228240966796875, 0.02884674072265625, 0.035465240478515625, 0.042083740234375, 0.048702239990234375, 0.05532073974609375, 0.061939239501953125, 0.0685577392578125, 0.07517623901367188, 0.08179473876953125, 0.08841323852539062, 0.09503173828125, 0.10165023803710938, 0.10826873779296875, 0.11488723754882812, 0.1215057373046875, 0.12812423706054688, 0.13474273681640625, 0.14136123657226562, 0.147979736328125, 0.15459823608398438, 0.16121673583984375, 0.16783523559570312, 0.1744537353515625, 0.18107223510742188, 0.18769073486328125, 0.19430923461914062, 0.200927734375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 18.0, 24.0, 36.0, 96.0, 246.0, 560.0, 1908.0, 11557.0, 690046.0, 3452386.0, 32813.0, 3128.0, 855.0, 315.0, 145.0, 52.0, 26.0, 26.0, 13.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0227508544921875, -0.988861083984375, -0.9549713134765625, -0.92108154296875, -0.8871917724609375, -0.853302001953125, -0.8194122314453125, -0.7855224609375, -0.7516326904296875, -0.717742919921875, -0.6838531494140625, -0.64996337890625, -0.6160736083984375, -0.582183837890625, -0.5482940673828125, -0.514404296875, -0.4805145263671875, -0.446624755859375, -0.4127349853515625, -0.37884521484375, -0.3449554443359375, -0.311065673828125, -0.2771759033203125, -0.2432861328125, -0.2093963623046875, -0.175506591796875, -0.1416168212890625, -0.10772705078125, -0.0738372802734375, -0.039947509765625, -0.0060577392578125, 0.02783203125, 0.0617218017578125, 0.095611572265625, 0.1295013427734375, 0.16339111328125, 0.1972808837890625, 0.231170654296875, 0.2650604248046875, 0.2989501953125, 0.3328399658203125, 0.366729736328125, 0.4006195068359375, 0.43450927734375, 0.4683990478515625, 0.502288818359375, 0.5361785888671875, 0.570068359375, 0.6039581298828125, 0.637847900390625, 0.6717376708984375, 0.70562744140625, 0.7395172119140625, 0.773406982421875, 0.8072967529296875, 0.8411865234375, 0.8750762939453125, 0.908966064453125, 0.9428558349609375, 0.97674560546875, 1.0106353759765625, 1.044525146484375, 1.0784149169921875, 1.1123046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 12.0, 3.0, 11.0, 18.0, 17.0, 50.0, 54.0, 69.0, 121.0, 207.0, 261.0, 368.0, 487.0, 559.0, 519.0, 411.0, 278.0, 227.0, 138.0, 87.0, 44.0, 45.0, 27.0, 20.0, 10.0, 8.0, 12.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1324462890625, -0.12764739990234375, -0.1228485107421875, -0.11804962158203125, -0.113250732421875, -0.10845184326171875, -0.1036529541015625, -0.09885406494140625, -0.09405517578125, -0.08925628662109375, -0.0844573974609375, -0.07965850830078125, -0.074859619140625, -0.07006072998046875, -0.0652618408203125, -0.06046295166015625, -0.0556640625, -0.05086517333984375, -0.0460662841796875, -0.04126739501953125, -0.036468505859375, -0.03166961669921875, -0.0268707275390625, -0.02207183837890625, -0.01727294921875, -0.01247406005859375, -0.0076751708984375, -0.00287628173828125, 0.001922607421875, 0.00672149658203125, 0.0115203857421875, 0.01631927490234375, 0.0211181640625, 0.02591705322265625, 0.0307159423828125, 0.03551483154296875, 0.040313720703125, 0.04511260986328125, 0.0499114990234375, 0.05471038818359375, 0.05950927734375, 0.06430816650390625, 0.0691070556640625, 0.07390594482421875, 0.078704833984375, 0.08350372314453125, 0.0883026123046875, 0.09310150146484375, 0.097900390625, 0.10269927978515625, 0.1074981689453125, 0.11229705810546875, 0.117095947265625, 0.12189483642578125, 0.1266937255859375, 0.13149261474609375, 0.13629150390625, 0.14109039306640625, 0.1458892822265625, 0.15068817138671875, 0.155487060546875, 0.16028594970703125, 0.1650848388671875, 0.16988372802734375, 0.1746826171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 8.0, 11.0, 7.0, 10.0, 13.0, 15.0, 22.0, 28.0, 35.0, 31.0, 38.0, 47.0, 37.0, 35.0, 70.0, 50.0, 60.0, 48.0, 53.0, 45.0, 59.0, 51.0, 37.0, 26.0, 30.0, 19.0, 21.0, 18.0, 15.0, 16.0, 13.0, 7.0, 6.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3278948962688446, -0.3179178535938263, -0.3079407811164856, -0.2979637384414673, -0.287986695766449, -0.2780096232891083, -0.26803258061408997, -0.25805550813674927, -0.24807846546173096, -0.23810140788555145, -0.22812435030937195, -0.21814730763435364, -0.20817025005817413, -0.19819319248199463, -0.18821614980697632, -0.17823909223079681, -0.1682620346546173, -0.1582849770784378, -0.1483079195022583, -0.13833087682724, -0.12835381925106049, -0.11837676167488098, -0.10839971154928207, -0.09842266142368317, -0.08844560384750366, -0.07846854627132416, -0.06849149614572525, -0.058514442294836044, -0.04853738844394684, -0.03856033459305763, -0.028583280742168427, -0.01860623061656952, -0.008629143238067627, 0.001347910612821579, 0.011324964463710785, 0.02130201831459999, 0.0312790721654892, 0.0412561260163784, 0.05123317986726761, 0.061210229992866516, 0.07118728756904602, 0.08116434514522552, 0.09114139527082443, 0.10111844539642334, 0.11109550297260284, 0.12107256054878235, 0.13104960322380066, 0.14102666079998016, 0.15100371837615967, 0.16098077595233917, 0.17095783352851868, 0.180934876203537, 0.1909119337797165, 0.200888991355896, 0.2108660340309143, 0.2208430916070938, 0.23082014918327332, 0.24079720675945282, 0.2507742643356323, 0.26075130701065063, 0.27072834968566895, 0.28070542216300964, 0.29068246483802795, 0.30065953731536865, 0.31063657999038696]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 17.0, 9.0, 6.0, 8.0, 12.0, 17.0, 17.0, 17.0, 25.0, 24.0, 27.0, 32.0, 39.0, 32.0, 39.0, 37.0, 29.0, 42.0, 33.0, 37.0, 44.0, 30.0, 40.0, 33.0, 35.0, 24.0, 24.0, 22.0, 26.0, 32.0, 31.0, 24.0, 17.0, 21.0, 17.0, 11.0, 15.0, 5.0, 4.0, 4.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26479968428611755, -0.25700971484184265, -0.24921973049640656, -0.24142974615097046, -0.23363977670669556, -0.22584979236125946, -0.21805980801582336, -0.21026983857154846, -0.20247985422611237, -0.19468986988067627, -0.18689990043640137, -0.17910991609096527, -0.17131993174552917, -0.16352996230125427, -0.15573997795581818, -0.14794999361038208, -0.14016002416610718, -0.13237003982067108, -0.12458007037639618, -0.11679008603096008, -0.10900010913610458, -0.10121013224124908, -0.09342014789581299, -0.08563017100095749, -0.07784019410610199, -0.07005021721124649, -0.06226023659110069, -0.054470255970954895, -0.046680279076099396, -0.038890302181243896, -0.0311003215610981, -0.0233103409409523, -0.015520364046096802, -0.007730385288596153, 5.959346890449524e-05, 0.007849572226405144, 0.015639550983905792, 0.02342952787876129, 0.03121950849890709, 0.03900948911905289, 0.046799466013908386, 0.054589442908763885, 0.06237942352890968, 0.07016940414905548, 0.07795938104391098, 0.08574935793876648, 0.09353934228420258, 0.10132931917905807, 0.10911929607391357, 0.11690927296876907, 0.12469924986362457, 0.13248923420906067, 0.14027920365333557, 0.14806918799877167, 0.15585917234420776, 0.16364914178848267, 0.17143912613391876, 0.17922911047935486, 0.18701907992362976, 0.19480906426906586, 0.20259904861450195, 0.21038901805877686, 0.21817900240421295, 0.22596898674964905, 0.23375895619392395]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 16.0, 30.0, 31.0, 37.0, 48.0, 97.0, 127.0, 173.0, 297.0, 430.0, 623.0, 931.0, 1433.0, 2208.0, 3395.0, 5096.0, 7739.0, 11739.0, 21646.0, 59683.0, 207997.0, 394308.0, 212392.0, 61132.0, 21872.0, 11971.0, 7784.0, 5264.0, 3459.0, 2224.0, 1515.0, 958.0, 652.0, 388.0, 282.0, 173.0, 107.0, 82.0, 65.0, 35.0, 29.0, 25.0, 13.0, 16.0, 7.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.07598876953125, -0.07341384887695312, -0.07083892822265625, -0.06826400756835938, -0.0656890869140625, -0.06311416625976562, -0.06053924560546875, -0.057964324951171875, -0.055389404296875, -0.052814483642578125, -0.05023956298828125, -0.047664642333984375, -0.0450897216796875, -0.042514801025390625, -0.03993988037109375, -0.037364959716796875, -0.0347900390625, -0.032215118408203125, -0.02964019775390625, -0.027065277099609375, -0.0244903564453125, -0.021915435791015625, -0.01934051513671875, -0.016765594482421875, -0.014190673828125, -0.011615753173828125, -0.00904083251953125, -0.006465911865234375, -0.0038909912109375, -0.001316070556640625, 0.00125885009765625, 0.003833770751953125, 0.00640869140625, 0.008983612060546875, 0.01155853271484375, 0.014133453369140625, 0.0167083740234375, 0.019283294677734375, 0.02185821533203125, 0.024433135986328125, 0.027008056640625, 0.029582977294921875, 0.03215789794921875, 0.034732818603515625, 0.0373077392578125, 0.039882659912109375, 0.04245758056640625, 0.045032501220703125, 0.047607421875, 0.050182342529296875, 0.05275726318359375, 0.055332183837890625, 0.0579071044921875, 0.060482025146484375, 0.06305694580078125, 0.06563186645507812, 0.068206787109375, 0.07078170776367188, 0.07335662841796875, 0.07593154907226562, 0.0785064697265625, 0.08108139038085938, 0.08365631103515625, 0.08623123168945312, 0.08880615234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 11.0, 12.0, 8.0, 14.0, 12.0, 16.0, 12.0, 22.0, 24.0, 20.0, 33.0, 35.0, 33.0, 40.0, 32.0, 35.0, 36.0, 44.0, 34.0, 37.0, 47.0, 38.0, 36.0, 26.0, 39.0, 17.0, 30.0, 37.0, 16.0, 28.0, 19.0, 26.0, 14.0, 21.0, 18.0, 11.0, 10.0, 16.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1614990234375, -0.15656661987304688, -0.15163421630859375, -0.14670181274414062, -0.1417694091796875, -0.13683700561523438, -0.13190460205078125, -0.12697219848632812, -0.122039794921875, -0.11710739135742188, -0.11217498779296875, -0.10724258422851562, -0.1023101806640625, -0.09737777709960938, -0.09244537353515625, -0.08751296997070312, -0.08258056640625, -0.07764816284179688, -0.07271575927734375, -0.06778335571289062, -0.0628509521484375, -0.057918548583984375, -0.05298614501953125, -0.048053741455078125, -0.043121337890625, -0.038188934326171875, -0.03325653076171875, -0.028324127197265625, -0.0233917236328125, -0.018459320068359375, -0.01352691650390625, -0.008594512939453125, -0.003662109375, 0.001270294189453125, 0.00620269775390625, 0.011135101318359375, 0.0160675048828125, 0.020999908447265625, 0.02593231201171875, 0.030864715576171875, 0.035797119140625, 0.040729522705078125, 0.04566192626953125, 0.050594329833984375, 0.0555267333984375, 0.060459136962890625, 0.06539154052734375, 0.07032394409179688, 0.07525634765625, 0.08018875122070312, 0.08512115478515625, 0.09005355834960938, 0.0949859619140625, 0.09991836547851562, 0.10485076904296875, 0.10978317260742188, 0.114715576171875, 0.11964797973632812, 0.12458038330078125, 0.12951278686523438, 0.1344451904296875, 0.13937759399414062, 0.14430999755859375, 0.14924240112304688, 0.1541748046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 4.0, 9.0, 13.0, 16.0, 22.0, 39.0, 42.0, 73.0, 99.0, 159.0, 241.0, 386.0, 633.0, 1140.0, 1982.0, 3690.0, 7371.0, 16338.0, 42353.0, 147229.0, 404680.0, 288805.0, 82929.0, 26900.0, 11408.0, 5374.0, 2841.0, 1505.0, 875.0, 482.0, 303.0, 204.0, 115.0, 94.0, 54.0, 39.0, 29.0, 19.0, 18.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07366943359375, -0.07119560241699219, -0.06872177124023438, -0.06624794006347656, -0.06377410888671875, -0.06130027770996094, -0.058826446533203125, -0.05635261535644531, -0.0538787841796875, -0.05140495300292969, -0.048931121826171875, -0.04645729064941406, -0.04398345947265625, -0.04150962829589844, -0.039035797119140625, -0.03656196594238281, -0.034088134765625, -0.03161430358886719, -0.029140472412109375, -0.026666641235351562, -0.02419281005859375, -0.021718978881835938, -0.019245147705078125, -0.016771316528320312, -0.0142974853515625, -0.011823654174804688, -0.009349822998046875, -0.0068759918212890625, -0.00440216064453125, -0.0019283294677734375, 0.000545501708984375, 0.0030193328857421875, 0.0054931640625, 0.007966995239257812, 0.010440826416015625, 0.012914657592773438, 0.01538848876953125, 0.017862319946289062, 0.020336151123046875, 0.022809982299804688, 0.0252838134765625, 0.027757644653320312, 0.030231475830078125, 0.03270530700683594, 0.03517913818359375, 0.03765296936035156, 0.040126800537109375, 0.04260063171386719, 0.045074462890625, 0.04754829406738281, 0.050022125244140625, 0.05249595642089844, 0.05496978759765625, 0.05744361877441406, 0.059917449951171875, 0.06239128112792969, 0.0648651123046875, 0.06733894348144531, 0.06981277465820312, 0.07228660583496094, 0.07476043701171875, 0.07723426818847656, 0.07970809936523438, 0.08218193054199219, 0.08465576171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 7.0, 7.0, 5.0, 6.0, 9.0, 8.0, 11.0, 17.0, 12.0, 7.0, 23.0, 28.0, 26.0, 26.0, 28.0, 44.0, 54.0, 31.0, 32.0, 47.0, 56.0, 35.0, 50.0, 52.0, 39.0, 47.0, 33.0, 43.0, 25.0, 36.0, 27.0, 26.0, 20.0, 19.0, 7.0, 12.0, 12.0, 6.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4284095764160156, -0.41516876220703125, -0.4019279479980469, -0.3886871337890625, -0.3754463195800781, -0.36220550537109375, -0.3489646911621094, -0.335723876953125, -0.3224830627441406, -0.30924224853515625, -0.2960014343261719, -0.2827606201171875, -0.2695198059082031, -0.25627899169921875, -0.24303817749023438, -0.22979736328125, -0.21655654907226562, -0.20331573486328125, -0.19007492065429688, -0.1768341064453125, -0.16359329223632812, -0.15035247802734375, -0.13711166381835938, -0.123870849609375, -0.11063003540039062, -0.09738922119140625, -0.08414840698242188, -0.0709075927734375, -0.057666778564453125, -0.04442596435546875, -0.031185150146484375, -0.0179443359375, -0.004703521728515625, 0.00853729248046875, 0.021778106689453125, 0.0350189208984375, 0.048259735107421875, 0.06150054931640625, 0.07474136352539062, 0.087982177734375, 0.10122299194335938, 0.11446380615234375, 0.12770462036132812, 0.1409454345703125, 0.15418624877929688, 0.16742706298828125, 0.18066787719726562, 0.19390869140625, 0.20714950561523438, 0.22039031982421875, 0.23363113403320312, 0.2468719482421875, 0.2601127624511719, 0.27335357666015625, 0.2865943908691406, 0.299835205078125, 0.3130760192871094, 0.32631683349609375, 0.3395576477050781, 0.3527984619140625, 0.3660392761230469, 0.37928009033203125, 0.3925209045410156, 0.40576171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 8.0, 7.0, 11.0, 7.0, 15.0, 25.0, 52.0, 61.0, 104.0, 171.0, 380.0, 621.0, 1297.0, 2608.0, 5886.0, 16039.0, 65488.0, 446853.0, 422027.0, 60863.0, 15243.0, 5822.0, 2385.0, 1221.0, 543.0, 330.0, 182.0, 111.0, 73.0, 42.0, 28.0, 20.0, 14.0, 9.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05694580078125, -0.05531787872314453, -0.05368995666503906, -0.052062034606933594, -0.050434112548828125, -0.048806190490722656, -0.04717826843261719, -0.04555034637451172, -0.04392242431640625, -0.04229450225830078, -0.04066658020019531, -0.039038658142089844, -0.037410736083984375, -0.035782814025878906, -0.03415489196777344, -0.03252696990966797, -0.0308990478515625, -0.02927112579345703, -0.027643203735351562, -0.026015281677246094, -0.024387359619140625, -0.022759437561035156, -0.021131515502929688, -0.01950359344482422, -0.01787567138671875, -0.01624774932861328, -0.014619827270507812, -0.012991905212402344, -0.011363983154296875, -0.009736061096191406, -0.008108139038085938, -0.006480216979980469, -0.004852294921875, -0.0032243728637695312, -0.0015964508056640625, 3.147125244140625e-05, 0.001659393310546875, 0.0032873153686523438, 0.0049152374267578125, 0.006543159484863281, 0.00817108154296875, 0.009799003601074219, 0.011426925659179688, 0.013054847717285156, 0.014682769775390625, 0.016310691833496094, 0.017938613891601562, 0.01956653594970703, 0.0211944580078125, 0.02282238006591797, 0.024450302124023438, 0.026078224182128906, 0.027706146240234375, 0.029334068298339844, 0.030961990356445312, 0.03258991241455078, 0.03421783447265625, 0.03584575653076172, 0.03747367858886719, 0.039101600646972656, 0.040729522705078125, 0.042357444763183594, 0.04398536682128906, 0.04561328887939453, 0.0472412109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 13.0, 8.0, 37.0, 54.0, 89.0, 92.0, 131.0, 143.0, 139.0, 92.0, 51.0, 33.0, 26.0, 14.0, 9.0, 4.0, 7.0, 3.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.063678741455078e-05, -2.978648990392685e-05, -2.8936192393302917e-05, -2.8085894882678986e-05, -2.7235597372055054e-05, -2.6385299861431122e-05, -2.553500235080719e-05, -2.4684704840183258e-05, -2.3834407329559326e-05, -2.2984109818935394e-05, -2.2133812308311462e-05, -2.128351479768753e-05, -2.04332172870636e-05, -1.9582919776439667e-05, -1.8732622265815735e-05, -1.7882324755191803e-05, -1.703202724456787e-05, -1.618172973394394e-05, -1.5331432223320007e-05, -1.4481134712696075e-05, -1.3630837202072144e-05, -1.2780539691448212e-05, -1.193024218082428e-05, -1.1079944670200348e-05, -1.0229647159576416e-05, -9.379349648952484e-06, -8.529052138328552e-06, -7.67875462770462e-06, -6.8284571170806885e-06, -5.978159606456757e-06, -5.127862095832825e-06, -4.277564585208893e-06, -3.427267074584961e-06, -2.576969563961029e-06, -1.7266720533370972e-06, -8.763745427131653e-07, -2.60770320892334e-08, 8.242204785346985e-07, 1.6745179891586304e-06, 2.5248154997825623e-06, 3.375113010406494e-06, 4.225410521030426e-06, 5.075708031654358e-06, 5.92600554227829e-06, 6.776303052902222e-06, 7.6266005635261536e-06, 8.476898074150085e-06, 9.327195584774017e-06, 1.017749309539795e-05, 1.1027790606021881e-05, 1.1878088116645813e-05, 1.2728385627269745e-05, 1.3578683137893677e-05, 1.4428980648517609e-05, 1.527927815914154e-05, 1.6129575669765472e-05, 1.6979873180389404e-05, 1.7830170691013336e-05, 1.8680468201637268e-05, 1.95307657122612e-05, 2.0381063222885132e-05, 2.1231360733509064e-05, 2.2081658244132996e-05, 2.2931955754756927e-05, 2.378225326538086e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 17.0, 18.0, 28.0, 35.0, 65.0, 112.0, 157.0, 292.0, 540.0, 883.0, 1534.0, 2859.0, 5364.0, 11616.0, 26500.0, 73937.0, 221073.0, 374496.0, 210661.0, 70244.0, 25643.0, 10862.0, 5357.0, 2662.0, 1516.0, 835.0, 459.0, 284.0, 184.0, 108.0, 68.0, 56.0, 41.0, 11.0, 8.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036468505859375, -0.03537893295288086, -0.03428936004638672, -0.03319978713989258, -0.03211021423339844, -0.031020641326904297, -0.029931068420410156, -0.028841495513916016, -0.027751922607421875, -0.026662349700927734, -0.025572776794433594, -0.024483203887939453, -0.023393630981445312, -0.022304058074951172, -0.02121448516845703, -0.02012491226196289, -0.01903533935546875, -0.01794576644897461, -0.01685619354248047, -0.015766620635986328, -0.014677047729492188, -0.013587474822998047, -0.012497901916503906, -0.011408329010009766, -0.010318756103515625, -0.009229183197021484, -0.008139610290527344, -0.007050037384033203, -0.0059604644775390625, -0.004870891571044922, -0.0037813186645507812, -0.0026917457580566406, -0.0016021728515625, -0.0005125999450683594, 0.0005769729614257812, 0.0016665458679199219, 0.0027561187744140625, 0.003845691680908203, 0.004935264587402344, 0.006024837493896484, 0.007114410400390625, 0.008203983306884766, 0.009293556213378906, 0.010383129119873047, 0.011472702026367188, 0.012562274932861328, 0.013651847839355469, 0.01474142074584961, 0.01583099365234375, 0.01692056655883789, 0.01801013946533203, 0.019099712371826172, 0.020189285278320312, 0.021278858184814453, 0.022368431091308594, 0.023458003997802734, 0.024547576904296875, 0.025637149810791016, 0.026726722717285156, 0.027816295623779297, 0.028905868530273438, 0.029995441436767578, 0.03108501434326172, 0.03217458724975586, 0.03326416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 9.0, 8.0, 6.0, 18.0, 14.0, 33.0, 54.0, 69.0, 95.0, 93.0, 138.0, 111.0, 99.0, 71.0, 58.0, 36.0, 26.0, 13.0, 13.0, 12.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01428985595703125, -0.01380765438079834, -0.01332545280456543, -0.01284325122833252, -0.01236104965209961, -0.0118788480758667, -0.011396646499633789, -0.010914444923400879, -0.010432243347167969, -0.009950041770935059, -0.009467840194702148, -0.008985638618469238, -0.008503437042236328, -0.008021235466003418, -0.007539033889770508, -0.007056832313537598, -0.0065746307373046875, -0.006092429161071777, -0.005610227584838867, -0.005128026008605957, -0.004645824432373047, -0.004163622856140137, -0.0036814212799072266, -0.0031992197036743164, -0.0027170181274414062, -0.002234816551208496, -0.001752614974975586, -0.0012704133987426758, -0.0007882118225097656, -0.00030601024627685547, 0.0001761913299560547, 0.0006583929061889648, 0.001140594482421875, 0.0016227960586547852, 0.0021049976348876953, 0.0025871992111206055, 0.0030694007873535156, 0.0035516023635864258, 0.004033803939819336, 0.004516005516052246, 0.004998207092285156, 0.005480408668518066, 0.0059626102447509766, 0.006444811820983887, 0.006927013397216797, 0.007409214973449707, 0.007891416549682617, 0.008373618125915527, 0.008855819702148438, 0.009338021278381348, 0.009820222854614258, 0.010302424430847168, 0.010784626007080078, 0.011266827583312988, 0.011749029159545898, 0.012231230735778809, 0.012713432312011719, 0.013195633888244629, 0.013677835464477539, 0.01416003704071045, 0.01464223861694336, 0.01512444019317627, 0.01560664176940918, 0.01608884334564209, 0.016571044921875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 17.0, 18.0, 23.0, 18.0, 23.0, 36.0, 43.0, 44.0, 61.0, 70.0, 67.0, 49.0, 61.0, 62.0, 58.0, 70.0, 43.0, 45.0, 26.0, 28.0, 20.0, 16.0, 19.0, 21.0, 13.0, 8.0, 11.0, 8.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23547668755054474, -0.22861741483211517, -0.2217581421136856, -0.21489888429641724, -0.20803961157798767, -0.2011803388595581, -0.19432106614112854, -0.18746179342269897, -0.1806025207042694, -0.17374324798583984, -0.16688397526741028, -0.1600247025489807, -0.15316544473171234, -0.14630617201328278, -0.1394468992948532, -0.13258762657642365, -0.12572836875915527, -0.11886909604072571, -0.11200983077287674, -0.10515055805444717, -0.0982912927865982, -0.09143202006816864, -0.08457274734973907, -0.07771347463130951, -0.07085420936346054, -0.06399493664503098, -0.05713567137718201, -0.05027639865875244, -0.043417129665613174, -0.03655786067247391, -0.029698587954044342, -0.022839318960905075, -0.015980035066604614, -0.009120765142142773, -0.002261495217680931, 0.004597775638103485, 0.011457044631242752, 0.01831631362438202, 0.025175586342811584, 0.03203485533595085, 0.03889412432909012, 0.045753393322229385, 0.05261266231536865, 0.05947193503379822, 0.06633120775222778, 0.07319047302007675, 0.08004974573850632, 0.08690901100635529, 0.09376828372478485, 0.10062755644321442, 0.10748682171106339, 0.11434609442949295, 0.12120535969734192, 0.12806463241577148, 0.13492390513420105, 0.14178317785263062, 0.14864245057106018, 0.15550172328948975, 0.1623609960079193, 0.16922026872634888, 0.17607952654361725, 0.18293879926204681, 0.18979807198047638, 0.19665734469890594, 0.20351660251617432]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 8.0, 2.0, 9.0, 9.0, 9.0, 10.0, 7.0, 7.0, 10.0, 10.0, 20.0, 19.0, 17.0, 22.0, 31.0, 27.0, 30.0, 33.0, 29.0, 35.0, 36.0, 40.0, 43.0, 35.0, 38.0, 33.0, 30.0, 26.0, 37.0, 30.0, 42.0, 30.0, 18.0, 23.0, 33.0, 16.0, 29.0, 24.0, 21.0, 12.0, 15.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.15810687839984894, -0.15346482396125793, -0.14882275462150574, -0.14418070018291473, -0.13953863084316254, -0.13489657640457153, -0.13025450706481934, -0.12561245262622833, -0.12097039818763733, -0.11632833629846573, -0.11168627440929413, -0.10704421997070312, -0.10240215808153152, -0.09776009619235992, -0.09311803430318832, -0.08847597241401672, -0.08383391052484512, -0.07919184863567352, -0.07454978674650192, -0.06990772485733032, -0.06526567041873932, -0.06062360852956772, -0.05598154664039612, -0.051339488476514816, -0.046697426587343216, -0.042055364698171616, -0.037413306534290314, -0.03277124464511871, -0.028129184618592262, -0.02348712459206581, -0.01884506270289421, -0.014203004539012909, -0.009560942649841309, -0.00491888215765357, -0.00027682166546583176, 0.004365239292383194, 0.009007299318909645, 0.013649359345436096, 0.018291421234607697, 0.022933479398489, 0.0275755412876606, 0.0322176031768322, 0.0368596613407135, 0.0415017232298851, 0.0461437851190567, 0.050785843282938004, 0.055427905172109604, 0.060069963335990906, 0.0647120252251625, 0.0693540871143341, 0.0739961490035057, 0.07863821089267731, 0.08328026533126831, 0.08792232722043991, 0.09256438910961151, 0.09720644354820251, 0.10184851288795471, 0.10649057477712631, 0.11113263666629791, 0.11577469110488892, 0.12041675299406052, 0.12505881488323212, 0.12970086932182312, 0.13434293866157532, 0.13898499310016632]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 6.0, 8.0, 15.0, 24.0, 45.0, 39.0, 44.0, 87.0, 157.0, 244.0, 416.0, 764.0, 1369.0, 2934.0, 6321.0, 14511.0, 34374.0, 82336.0, 186127.0, 300789.0, 229708.0, 107689.0, 45503.0, 19071.0, 8335.0, 3694.0, 1700.0, 933.0, 485.0, 282.0, 180.0, 107.0, 88.0, 53.0, 31.0, 20.0, 15.0, 12.0, 13.0, 1.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2516441345214844, -0.24254608154296875, -0.23344802856445312, -0.2243499755859375, -0.21525192260742188, -0.20615386962890625, -0.19705581665039062, -0.187957763671875, -0.17885971069335938, -0.16976165771484375, -0.16066360473632812, -0.1515655517578125, -0.14246749877929688, -0.13336944580078125, -0.12427139282226562, -0.11517333984375, -0.10607528686523438, -0.09697723388671875, -0.08787918090820312, -0.0787811279296875, -0.06968307495117188, -0.06058502197265625, -0.051486968994140625, -0.042388916015625, -0.033290863037109375, -0.02419281005859375, -0.015094757080078125, -0.0059967041015625, 0.003101348876953125, 0.01219940185546875, 0.021297454833984375, 0.0303955078125, 0.039493560791015625, 0.04859161376953125, 0.057689666748046875, 0.0667877197265625, 0.07588577270507812, 0.08498382568359375, 0.09408187866210938, 0.103179931640625, 0.11227798461914062, 0.12137603759765625, 0.13047409057617188, 0.1395721435546875, 0.14867019653320312, 0.15776824951171875, 0.16686630249023438, 0.17596435546875, 0.18506240844726562, 0.19416046142578125, 0.20325851440429688, 0.2123565673828125, 0.22145462036132812, 0.23055267333984375, 0.23965072631835938, 0.248748779296875, 0.2578468322753906, 0.26694488525390625, 0.2760429382324219, 0.2851409912109375, 0.2942390441894531, 0.30333709716796875, 0.3124351501464844, 0.321533203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 11.0, 8.0, 10.0, 8.0, 4.0, 14.0, 16.0, 18.0, 27.0, 22.0, 24.0, 38.0, 44.0, 51.0, 35.0, 43.0, 47.0, 44.0, 52.0, 40.0, 58.0, 49.0, 46.0, 32.0, 27.0, 35.0, 37.0, 36.0, 25.0, 23.0, 17.0, 14.0, 13.0, 7.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28662109375, -0.27622222900390625, -0.2658233642578125, -0.25542449951171875, -0.245025634765625, -0.23462677001953125, -0.2242279052734375, -0.21382904052734375, -0.20343017578125, -0.19303131103515625, -0.1826324462890625, -0.17223358154296875, -0.161834716796875, -0.15143585205078125, -0.1410369873046875, -0.13063812255859375, -0.1202392578125, -0.10984039306640625, -0.0994415283203125, -0.08904266357421875, -0.078643798828125, -0.06824493408203125, -0.0578460693359375, -0.04744720458984375, -0.03704833984375, -0.02664947509765625, -0.0162506103515625, -0.00585174560546875, 0.004547119140625, 0.01494598388671875, 0.0253448486328125, 0.03574371337890625, 0.046142578125, 0.05654144287109375, 0.0669403076171875, 0.07733917236328125, 0.087738037109375, 0.09813690185546875, 0.1085357666015625, 0.11893463134765625, 0.12933349609375, 0.13973236083984375, 0.1501312255859375, 0.16053009033203125, 0.170928955078125, 0.18132781982421875, 0.1917266845703125, 0.20212554931640625, 0.2125244140625, 0.22292327880859375, 0.2333221435546875, 0.24372100830078125, 0.254119873046875, 0.26451873779296875, 0.2749176025390625, 0.28531646728515625, 0.29571533203125, 0.30611419677734375, 0.3165130615234375, 0.32691192626953125, 0.337310791015625, 0.34770965576171875, 0.3581085205078125, 0.36850738525390625, 0.37890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 15.0, 20.0, 16.0, 18.0, 26.0, 40.0, 50.0, 65.0, 90.0, 141.0, 163.0, 309.0, 451.0, 846.0, 1739.0, 4143.0, 10876.0, 30521.0, 88275.0, 238448.0, 366400.0, 195321.0, 70351.0, 24455.0, 8915.0, 3411.0, 1425.0, 758.0, 420.0, 250.0, 143.0, 111.0, 90.0, 67.0, 45.0, 34.0, 24.0, 23.0, 19.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.429931640625, -0.4181175231933594, -0.40630340576171875, -0.3944892883300781, -0.3826751708984375, -0.3708610534667969, -0.35904693603515625, -0.3472328186035156, -0.335418701171875, -0.3236045837402344, -0.31179046630859375, -0.2999763488769531, -0.2881622314453125, -0.2763481140136719, -0.26453399658203125, -0.2527198791503906, -0.24090576171875, -0.22909164428710938, -0.21727752685546875, -0.20546340942382812, -0.1936492919921875, -0.18183517456054688, -0.17002105712890625, -0.15820693969726562, -0.146392822265625, -0.13457870483398438, -0.12276458740234375, -0.11095046997070312, -0.0991363525390625, -0.08732223510742188, -0.07550811767578125, -0.06369400024414062, -0.0518798828125, -0.040065765380859375, -0.02825164794921875, -0.016437530517578125, -0.0046234130859375, 0.007190704345703125, 0.01900482177734375, 0.030818939208984375, 0.042633056640625, 0.054447174072265625, 0.06626129150390625, 0.07807540893554688, 0.0898895263671875, 0.10170364379882812, 0.11351776123046875, 0.12533187866210938, 0.13714599609375, 0.14896011352539062, 0.16077423095703125, 0.17258834838867188, 0.1844024658203125, 0.19621658325195312, 0.20803070068359375, 0.21984481811523438, 0.231658935546875, 0.24347305297851562, 0.25528717041015625, 0.2671012878417969, 0.2789154052734375, 0.2907295227050781, 0.30254364013671875, 0.3143577575683594, 0.326171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 5.0, 6.0, 8.0, 16.0, 14.0, 15.0, 19.0, 20.0, 31.0, 24.0, 37.0, 39.0, 36.0, 40.0, 45.0, 63.0, 63.0, 47.0, 64.0, 42.0, 52.0, 44.0, 25.0, 35.0, 32.0, 29.0, 28.0, 20.0, 19.0, 14.0, 4.0, 11.0, 6.0, 11.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40625, -0.3944587707519531, -0.38266754150390625, -0.3708763122558594, -0.3590850830078125, -0.3472938537597656, -0.33550262451171875, -0.3237113952636719, -0.311920166015625, -0.3001289367675781, -0.28833770751953125, -0.2765464782714844, -0.2647552490234375, -0.2529640197753906, -0.24117279052734375, -0.22938156127929688, -0.21759033203125, -0.20579910278320312, -0.19400787353515625, -0.18221664428710938, -0.1704254150390625, -0.15863418579101562, -0.14684295654296875, -0.13505172729492188, -0.123260498046875, -0.11146926879882812, -0.09967803955078125, -0.08788681030273438, -0.0760955810546875, -0.06430435180664062, -0.05251312255859375, -0.040721893310546875, -0.0289306640625, -0.017139434814453125, -0.00534820556640625, 0.006443023681640625, 0.0182342529296875, 0.030025482177734375, 0.04181671142578125, 0.053607940673828125, 0.065399169921875, 0.07719039916992188, 0.08898162841796875, 0.10077285766601562, 0.1125640869140625, 0.12435531616210938, 0.13614654541015625, 0.14793777465820312, 0.15972900390625, 0.17152023315429688, 0.18331146240234375, 0.19510269165039062, 0.2068939208984375, 0.21868515014648438, 0.23047637939453125, 0.24226760864257812, 0.254058837890625, 0.2658500671386719, 0.27764129638671875, 0.2894325256347656, 0.3012237548828125, 0.3130149841308594, 0.32480621337890625, 0.3365974426269531, 0.348388671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 12.0, 8.0, 17.0, 22.0, 40.0, 51.0, 93.0, 141.0, 255.0, 507.0, 975.0, 1999.0, 4392.0, 10123.0, 24216.0, 59692.0, 144641.0, 348966.0, 254012.0, 116330.0, 47639.0, 19250.0, 8111.0, 3571.0, 1680.0, 822.0, 430.0, 231.0, 135.0, 78.0, 42.0, 20.0, 16.0, 14.0, 7.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06207275390625, -0.06012535095214844, -0.058177947998046875, -0.05623054504394531, -0.05428314208984375, -0.05233573913574219, -0.050388336181640625, -0.04844093322753906, -0.0464935302734375, -0.04454612731933594, -0.042598724365234375, -0.04065132141113281, -0.03870391845703125, -0.03675651550292969, -0.034809112548828125, -0.03286170959472656, -0.030914306640625, -0.028966903686523438, -0.027019500732421875, -0.025072097778320312, -0.02312469482421875, -0.021177291870117188, -0.019229888916015625, -0.017282485961914062, -0.0153350830078125, -0.013387680053710938, -0.011440277099609375, -0.009492874145507812, -0.00754547119140625, -0.0055980682373046875, -0.003650665283203125, -0.0017032623291015625, 0.000244140625, 0.0021915435791015625, 0.004138946533203125, 0.0060863494873046875, 0.00803375244140625, 0.009981155395507812, 0.011928558349609375, 0.013875961303710938, 0.0158233642578125, 0.017770767211914062, 0.019718170166015625, 0.021665573120117188, 0.02361297607421875, 0.025560379028320312, 0.027507781982421875, 0.029455184936523438, 0.031402587890625, 0.03334999084472656, 0.035297393798828125, 0.03724479675292969, 0.03919219970703125, 0.04113960266113281, 0.043087005615234375, 0.04503440856933594, 0.0469818115234375, 0.04892921447753906, 0.050876617431640625, 0.05282402038574219, 0.05477142333984375, 0.05671882629394531, 0.058666229248046875, 0.06061363220214844, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 2.0, 3.0, 11.0, 14.0, 13.0, 15.0, 18.0, 24.0, 18.0, 25.0, 24.0, 40.0, 43.0, 45.0, 51.0, 51.0, 83.0, 84.0, 62.0, 52.0, 64.0, 30.0, 34.0, 28.0, 22.0, 28.0, 19.0, 16.0, 15.0, 17.0, 4.0, 10.0, 2.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-06, -7.482245564460754e-06, -7.156282663345337e-06, -6.8303197622299194e-06, -6.504356861114502e-06, -6.1783939599990845e-06, -5.852431058883667e-06, -5.5264681577682495e-06, -5.200505256652832e-06, -4.8745423555374146e-06, -4.548579454421997e-06, -4.22261655330658e-06, -3.896653652191162e-06, -3.5706907510757446e-06, -3.244727849960327e-06, -2.9187649488449097e-06, -2.592802047729492e-06, -2.2668391466140747e-06, -1.9408762454986572e-06, -1.6149133443832397e-06, -1.2889504432678223e-06, -9.629875421524048e-07, -6.370246410369873e-07, -3.110617399215698e-07, 1.4901161193847656e-08, 3.4086406230926514e-07, 6.668269634246826e-07, 9.927898645401e-07, 1.3187527656555176e-06, 1.644715666770935e-06, 1.9706785678863525e-06, 2.29664146900177e-06, 2.6226043701171875e-06, 2.948567271232605e-06, 3.2745301723480225e-06, 3.60049307346344e-06, 3.926455974578857e-06, 4.252418875694275e-06, 4.578381776809692e-06, 4.90434467792511e-06, 5.230307579040527e-06, 5.556270480155945e-06, 5.882233381271362e-06, 6.20819628238678e-06, 6.534159183502197e-06, 6.860122084617615e-06, 7.186084985733032e-06, 7.51204788684845e-06, 7.838010787963867e-06, 8.163973689079285e-06, 8.489936590194702e-06, 8.81589949131012e-06, 9.141862392425537e-06, 9.467825293540955e-06, 9.793788194656372e-06, 1.011975109577179e-05, 1.0445713996887207e-05, 1.0771676898002625e-05, 1.1097639799118042e-05, 1.142360270023346e-05, 1.1749565601348877e-05, 1.2075528502464294e-05, 1.2401491403579712e-05, 1.272745430469513e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 9.0, 13.0, 19.0, 30.0, 36.0, 61.0, 92.0, 149.0, 209.0, 329.0, 501.0, 788.0, 1370.0, 2575.0, 5066.0, 11787.0, 33178.0, 101673.0, 277720.0, 398611.0, 139584.0, 45362.0, 15815.0, 6401.0, 3037.0, 1579.0, 965.0, 538.0, 367.0, 243.0, 154.0, 104.0, 71.0, 44.0, 27.0, 15.0, 16.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08099365234375, -0.07839298248291016, -0.07579231262207031, -0.07319164276123047, -0.07059097290039062, -0.06799030303955078, -0.06538963317871094, -0.0627889633178711, -0.06018829345703125, -0.057587623596191406, -0.05498695373535156, -0.05238628387451172, -0.049785614013671875, -0.04718494415283203, -0.04458427429199219, -0.041983604431152344, -0.0393829345703125, -0.036782264709472656, -0.03418159484863281, -0.03158092498779297, -0.028980255126953125, -0.02637958526611328, -0.023778915405273438, -0.021178245544433594, -0.01857757568359375, -0.015976905822753906, -0.013376235961914062, -0.010775566101074219, -0.008174896240234375, -0.005574226379394531, -0.0029735565185546875, -0.00037288665771484375, 0.002227783203125, 0.004828453063964844, 0.0074291229248046875, 0.010029792785644531, 0.012630462646484375, 0.015231132507324219, 0.017831802368164062, 0.020432472229003906, 0.02303314208984375, 0.025633811950683594, 0.028234481811523438, 0.03083515167236328, 0.033435821533203125, 0.03603649139404297, 0.03863716125488281, 0.041237831115722656, 0.0438385009765625, 0.046439170837402344, 0.04903984069824219, 0.05164051055908203, 0.054241180419921875, 0.05684185028076172, 0.05944252014160156, 0.062043190002441406, 0.06464385986328125, 0.0672445297241211, 0.06984519958496094, 0.07244586944580078, 0.07504653930664062, 0.07764720916748047, 0.08024787902832031, 0.08284854888916016, 0.08544921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 8.0, 7.0, 17.0, 22.0, 50.0, 64.0, 120.0, 136.0, 234.0, 102.0, 78.0, 49.0, 34.0, 19.0, 12.0, 14.0, 4.0, 5.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10595703125, -0.10302448272705078, -0.10009193420410156, -0.09715938568115234, -0.09422683715820312, -0.0912942886352539, -0.08836174011230469, -0.08542919158935547, -0.08249664306640625, -0.07956409454345703, -0.07663154602050781, -0.0736989974975586, -0.07076644897460938, -0.06783390045166016, -0.06490135192871094, -0.06196880340576172, -0.0590362548828125, -0.05610370635986328, -0.05317115783691406, -0.050238609313964844, -0.047306060791015625, -0.044373512268066406, -0.04144096374511719, -0.03850841522216797, -0.03557586669921875, -0.03264331817626953, -0.029710769653320312, -0.026778221130371094, -0.023845672607421875, -0.020913124084472656, -0.017980575561523438, -0.015048027038574219, -0.012115478515625, -0.009182929992675781, -0.0062503814697265625, -0.0033178329467773438, -0.000385284423828125, 0.0025472640991210938, 0.0054798126220703125, 0.008412361145019531, 0.01134490966796875, 0.014277458190917969, 0.017210006713867188, 0.020142555236816406, 0.023075103759765625, 0.026007652282714844, 0.028940200805664062, 0.03187274932861328, 0.0348052978515625, 0.03773784637451172, 0.04067039489746094, 0.043602943420410156, 0.046535491943359375, 0.049468040466308594, 0.05240058898925781, 0.05533313751220703, 0.05826568603515625, 0.06119823455810547, 0.06413078308105469, 0.0670633316040039, 0.06999588012695312, 0.07292842864990234, 0.07586097717285156, 0.07879352569580078, 0.08172607421875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 12.0, 21.0, 29.0, 42.0, 46.0, 64.0, 75.0, 85.0, 107.0, 115.0, 83.0, 66.0, 64.0, 45.0, 41.0, 31.0, 26.0, 9.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8088246583938599, -0.7880679368972778, -0.7673112154006958, -0.7465544939041138, -0.7257977724075317, -0.7050409913063049, -0.6842842698097229, -0.6635275483131409, -0.6427708268165588, -0.6220141053199768, -0.6012573838233948, -0.5805006623268127, -0.5597438812255859, -0.5389871597290039, -0.5182304382324219, -0.49747371673583984, -0.4767169952392578, -0.4559602737426758, -0.43520355224609375, -0.41444680094718933, -0.3936900794506073, -0.37293335795402527, -0.35217660665512085, -0.3314198851585388, -0.3106631636619568, -0.28990644216537476, -0.2691497206687927, -0.2483929693698883, -0.22763624787330627, -0.20687952637672424, -0.18612278997898102, -0.1653660535812378, -0.14460933208465576, -0.12385260313749313, -0.1030958741903305, -0.08233914524316788, -0.06158241629600525, -0.04082568734884262, -0.020068958401679993, 0.0006877779960632324, 0.021444499492645264, 0.04220122843980789, 0.06295795738697052, 0.08371468633413315, 0.10447141528129578, 0.1252281367778778, 0.14598487317562103, 0.16674160957336426, 0.1874983310699463, 0.20825505256652832, 0.22901178896427155, 0.24976852536201477, 0.2705252468585968, 0.29128196835517883, 0.31203871965408325, 0.3327954411506653, 0.3535521626472473, 0.37430888414382935, 0.3950656056404114, 0.4158223569393158, 0.4365790784358978, 0.45733579993247986, 0.4780925512313843, 0.4988492727279663, 0.5196059942245483]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 0.0, 6.0, 5.0, 7.0, 11.0, 12.0, 8.0, 10.0, 10.0, 10.0, 21.0, 17.0, 22.0, 25.0, 30.0, 25.0, 24.0, 33.0, 32.0, 36.0, 46.0, 47.0, 36.0, 33.0, 40.0, 36.0, 40.0, 36.0, 44.0, 41.0, 26.0, 28.0, 31.0, 24.0, 15.0, 17.0, 20.0, 20.0, 15.0, 9.0, 13.0, 9.0, 5.0, 7.0, 6.0, 2.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5575844049453735, -0.5409726500511169, -0.5243608951568604, -0.5077491402626038, -0.49113738536834717, -0.4745256304740906, -0.45791390538215637, -0.4413021504878998, -0.4246903955936432, -0.4080786406993866, -0.39146688580513, -0.3748551309108734, -0.3582434058189392, -0.3416316509246826, -0.325019896030426, -0.30840814113616943, -0.29179638624191284, -0.27518463134765625, -0.25857287645339966, -0.24196113646030426, -0.22534938156604767, -0.20873762667179108, -0.19212588667869568, -0.1755141317844391, -0.1589023768901825, -0.1422906219959259, -0.1256788671016693, -0.10906712710857391, -0.09245537221431732, -0.07584361732006073, -0.059231869876384735, -0.04262012243270874, -0.02600836753845215, -0.009396616369485855, 0.007215134799480438, 0.02382688596844673, 0.040438637137413025, 0.05705039203166962, 0.07366213947534561, 0.0902738869190216, 0.1068856418132782, 0.12349739670753479, 0.14010915160179138, 0.15672089159488678, 0.17333264648914337, 0.18994440138339996, 0.20655614137649536, 0.22316789627075195, 0.23977965116500854, 0.25639140605926514, 0.27300316095352173, 0.2896149158477783, 0.3062266707420349, 0.3228384256362915, 0.3394501507282257, 0.3560619056224823, 0.3726736605167389, 0.3892854154109955, 0.4058971703052521, 0.42250892519950867, 0.43912065029144287, 0.45573240518569946, 0.47234416007995605, 0.48895591497421265, 0.5055676698684692]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 14.0, 15.0, 18.0, 31.0, 43.0, 44.0, 64.0, 122.0, 154.0, 225.0, 372.0, 496.0, 684.0, 1004.0, 1492.0, 2347.0, 3762.0, 6234.0, 1009596.0, 8782.0, 5288.0, 3295.0, 2125.0, 1369.0, 980.0, 635.0, 418.0, 294.0, 218.0, 153.0, 93.0, 76.0, 48.0, 28.0, 20.0, 14.0, 9.0, 12.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5183072090148926, -0.5015133023262024, -0.4847193956375122, -0.467925488948822, -0.45113155245780945, -0.43433764576911926, -0.4175437390804291, -0.4007498323917389, -0.3839558959007263, -0.36716198921203613, -0.35036808252334595, -0.33357417583465576, -0.3167802393436432, -0.299986332654953, -0.2831924259662628, -0.26639851927757263, -0.24960461258888245, -0.23281070590019226, -0.21601678431034088, -0.1992228776216507, -0.18242895603179932, -0.16563504934310913, -0.14884114265441895, -0.13204723596572876, -0.11525331437587738, -0.0984594002366066, -0.08166548609733582, -0.06487157940864563, -0.04807766526937485, -0.031283751130104065, -0.01448984444141388, 0.002304069697856903, 0.019097983837127686, 0.03589189797639847, 0.05268580839037895, 0.06947971880435944, 0.08627363294363022, 0.103067547082901, 0.11986145377159119, 0.13665536046028137, 0.15344928205013275, 0.17024318873882294, 0.18703711032867432, 0.2038310170173645, 0.2206249237060547, 0.23741884529590607, 0.25421273708343506, 0.27100667357444763, 0.2878005802631378, 0.304594486951828, 0.3213883936405182, 0.33818233013153076, 0.35497623682022095, 0.37177014350891113, 0.3885640501976013, 0.4053579568862915, 0.4221518635749817, 0.4389457702636719, 0.45573967695236206, 0.47253358364105225, 0.4893275201320648, 0.5061213970184326, 0.5229153633117676, 0.5397092700004578, 0.556503176689148]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 6.0, 10.0, 21.0, 39.0, 54.0, 81.0, 202.0, 346.0, 632.0, 1153.0, 2073.0, 4051.0, 10658.0, 51404888.0, 33277.0, 6109.0, 3075.0, 1605.0, 892.0, 490.0, 281.0, 167.0, 86.0, 44.0, 31.0, 18.0, 14.0, 9.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65234375, -5.455806255340576, -5.259268760681152, -5.06273078918457, -4.8661932945251465, -4.669655799865723, -4.473118305206299, -4.276580810546875, -4.080043315887451, -3.8835058212280273, -3.6869680881500244, -3.4904305934906006, -3.2938930988311768, -3.097355365753174, -2.90081787109375, -2.704280376434326, -2.5077426433563232, -2.3112051486968994, -2.1146674156188965, -1.9181299209594727, -1.7215924263000488, -1.5250548124313354, -1.328517198562622, -1.1319797039031982, -0.9354420900344849, -0.7389045357704163, -0.5423669815063477, -0.3458293676376343, -0.14929181337356567, 0.04724574089050293, 0.2437833547592163, 0.44032084941864014, 0.6368584632873535, 0.8333960175514221, 1.0299335718154907, 1.226471185684204, 1.423008680343628, 1.6195462942123413, 1.8160839080810547, 2.0126214027404785, 2.2091588973999023, 2.405696392059326, 2.602234125137329, 2.798771619796753, 2.9953091144561768, 3.1918468475341797, 3.3883843421936035, 3.5849218368530273, 3.7814595699310303, 3.977997064590454, 4.174534797668457, 4.371072292327881, 4.567609786987305, 4.7641472816467285, 4.960684776306152, 5.157222747802734, 5.353760242462158, 5.550297737121582, 5.746835231781006, 5.94337272644043, 6.139910697937012, 6.3364481925964355, 6.532985687255859, 6.729523181915283, 6.926060676574707]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 11.0, 12.0, 16.0, 34.0, 60.0, 88.0, 157.0, 257.0, 360.0, 673.0, 994.0, 1613.0, 2744.0, 4405.0, 7380.0, 12715.0, 21183.0, 36544.0, 61043.0, 101888.0, 160428.0, 236500.0, 324469.0, 531979.0, 3229397.0, 565899.0, 329037.0, 240176.0, 163671.0, 103322.0, 63526.0, 37204.0, 21588.0, 13079.0, 7506.0, 4574.0, 2702.0, 1595.0, 1049.0, 617.0, 379.0, 207.0, 126.0, 89.0, 52.0, 39.0, 17.0, 15.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.54833984375, -0.53094482421875, -0.5135498046875, -0.49615478515625, -0.478759765625, -0.46136474609375, -0.4439697265625, -0.42657470703125, -0.4091796875, -0.39178466796875, -0.3743896484375, -0.35699462890625, -0.339599609375, -0.32220458984375, -0.3048095703125, -0.28741455078125, -0.27001953125, -0.25262451171875, -0.2352294921875, -0.21783447265625, -0.200439453125, -0.18304443359375, -0.1656494140625, -0.14825439453125, -0.130859375, -0.11346435546875, -0.0960693359375, -0.07867431640625, -0.061279296875, -0.04388427734375, -0.0264892578125, -0.00909423828125, 0.00830078125, 0.02569580078125, 0.0430908203125, 0.06048583984375, 0.077880859375, 0.09527587890625, 0.1126708984375, 0.13006591796875, 0.1474609375, 0.16485595703125, 0.1822509765625, 0.19964599609375, 0.217041015625, 0.23443603515625, 0.2518310546875, 0.26922607421875, 0.28662109375, 0.30401611328125, 0.3214111328125, 0.33880615234375, 0.356201171875, 0.37359619140625, 0.3909912109375, 0.40838623046875, 0.42578125, 0.44317626953125, 0.4605712890625, 0.47796630859375, 0.495361328125, 0.51275634765625, 0.5301513671875, 0.54754638671875, 0.56494140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 1.0, 8.0, 7.0, 12.0, 12.0, 16.0, 16.0, 17.0, 33.0, 27.0, 33.0, 39.0, 59.0, 44.0, 50.0, 45.0, 117.0, 798.0, 253.0, 63.0, 51.0, 54.0, 45.0, 29.0, 40.0, 23.0, 22.0, 23.0, 19.0, 25.0, 6.0, 7.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.28680419921875, -4.1322021484375, -3.97760009765625, -3.822998046875, -3.66839599609375, -3.5137939453125, -3.35919189453125, -3.20458984375, -3.04998779296875, -2.8953857421875, -2.74078369140625, -2.586181640625, -2.43157958984375, -2.2769775390625, -2.12237548828125, -1.9677734375, -1.81317138671875, -1.6585693359375, -1.50396728515625, -1.349365234375, -1.19476318359375, -1.0401611328125, -0.88555908203125, -0.73095703125, -0.57635498046875, -0.4217529296875, -0.26715087890625, -0.112548828125, 0.04205322265625, 0.1966552734375, 0.35125732421875, 0.505859375, 0.66046142578125, 0.8150634765625, 0.96966552734375, 1.124267578125, 1.27886962890625, 1.4334716796875, 1.58807373046875, 1.74267578125, 1.89727783203125, 2.0518798828125, 2.20648193359375, 2.361083984375, 2.51568603515625, 2.6702880859375, 2.82489013671875, 2.9794921875, 3.13409423828125, 3.2886962890625, 3.44329833984375, 3.597900390625, 3.75250244140625, 3.9071044921875, 4.06170654296875, 4.21630859375, 4.37091064453125, 4.5255126953125, 4.68011474609375, 4.834716796875, 4.98931884765625, 5.1439208984375, 5.29852294921875, 5.453125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 7.0, 18.0, 26.0, 31.0, 78.0, 143.0, 283.0, 481.0, 857.0, 1616.0, 2745.0, 4801.0, 8220.0, 13815.0, 22881.0, 36162.0, 55233.0, 83053.0, 118733.0, 161470.0, 210079.0, 256878.0, 306615.0, 2030191.0, 1724125.0, 299246.0, 251881.0, 205778.0, 158386.0, 115020.0, 80411.0, 53732.0, 34704.0, 21659.0, 13314.0, 7965.0, 4743.0, 2716.0, 1426.0, 842.0, 436.0, 272.0, 168.0, 99.0, 46.0, 27.0, 18.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.302001953125, -0.2912025451660156, -0.28040313720703125, -0.2696037292480469, -0.2588043212890625, -0.24800491333007812, -0.23720550537109375, -0.22640609741210938, -0.215606689453125, -0.20480728149414062, -0.19400787353515625, -0.18320846557617188, -0.1724090576171875, -0.16160964965820312, -0.15081024169921875, -0.14001083374023438, -0.12921142578125, -0.11841201782226562, -0.10761260986328125, -0.09681320190429688, -0.0860137939453125, -0.07521438598632812, -0.06441497802734375, -0.053615570068359375, -0.042816162109375, -0.032016754150390625, -0.02121734619140625, -0.010417938232421875, 0.0003814697265625, 0.011180877685546875, 0.02198028564453125, 0.032779693603515625, 0.0435791015625, 0.054378509521484375, 0.06517791748046875, 0.07597732543945312, 0.0867767333984375, 0.09757614135742188, 0.10837554931640625, 0.11917495727539062, 0.129974365234375, 0.14077377319335938, 0.15157318115234375, 0.16237258911132812, 0.1731719970703125, 0.18397140502929688, 0.19477081298828125, 0.20557022094726562, 0.21636962890625, 0.22716903686523438, 0.23796844482421875, 0.24876785278320312, 0.2595672607421875, 0.2703666687011719, 0.28116607666015625, 0.2919654846191406, 0.302764892578125, 0.3135643005371094, 0.32436370849609375, 0.3351631164550781, 0.3459625244140625, 0.3567619323730469, 0.36756134033203125, 0.3783607482910156, 0.38916015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 1.0, 7.0, 10.0, 10.0, 8.0, 11.0, 14.0, 23.0, 15.0, 25.0, 23.0, 26.0, 33.0, 43.0, 36.0, 31.0, 42.0, 31.0, 39.0, 65.0, 499.0, 537.0, 54.0, 31.0, 33.0, 36.0, 29.0, 23.0, 27.0, 30.0, 26.0, 18.0, 25.0, 24.0, 19.0, 13.0, 19.0, 13.0, 16.0, 7.0, 8.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.140625, -3.042633056640625, -2.94464111328125, -2.846649169921875, -2.7486572265625, -2.650665283203125, -2.55267333984375, -2.454681396484375, -2.356689453125, -2.258697509765625, -2.16070556640625, -2.062713623046875, -1.9647216796875, -1.866729736328125, -1.76873779296875, -1.670745849609375, -1.57275390625, -1.474761962890625, -1.37677001953125, -1.278778076171875, -1.1807861328125, -1.082794189453125, -0.98480224609375, -0.886810302734375, -0.788818359375, -0.690826416015625, -0.59283447265625, -0.494842529296875, -0.3968505859375, -0.298858642578125, -0.20086669921875, -0.102874755859375, -0.0048828125, 0.093109130859375, 0.19110107421875, 0.289093017578125, 0.3870849609375, 0.485076904296875, 0.58306884765625, 0.681060791015625, 0.779052734375, 0.877044677734375, 0.97503662109375, 1.073028564453125, 1.1710205078125, 1.269012451171875, 1.36700439453125, 1.464996337890625, 1.56298828125, 1.660980224609375, 1.75897216796875, 1.856964111328125, 1.9549560546875, 2.052947998046875, 2.15093994140625, 2.248931884765625, 2.346923828125, 2.444915771484375, 2.54290771484375, 2.640899658203125, 2.7388916015625, 2.836883544921875, 2.93487548828125, 3.032867431640625, 3.130859375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 12.0, 17.0, 19.0, 29.0, 36.0, 61.0, 66.0, 99.0, 135.0, 211.0, 264.0, 363.0, 573.0, 798.0, 1238.0, 2014.0, 3645.0, 7434.0, 17970.0, 46947.0, 112513.0, 4123134.0, 1780856.0, 112205.0, 46100.0, 17823.0, 7366.0, 3538.0, 1976.0, 1278.0, 779.0, 542.0, 362.0, 271.0, 220.0, 159.0, 101.0, 80.0, 58.0, 37.0, 35.0, 18.0, 12.0, 14.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5537109375, -1.5001220703125, -1.446533203125, -1.3929443359375, -1.33935546875, -1.2857666015625, -1.232177734375, -1.1785888671875, -1.125, -1.0714111328125, -1.017822265625, -0.9642333984375, -0.91064453125, -0.8570556640625, -0.803466796875, -0.7498779296875, -0.6962890625, -0.6427001953125, -0.589111328125, -0.5355224609375, -0.48193359375, -0.4283447265625, -0.374755859375, -0.3211669921875, -0.267578125, -0.2139892578125, -0.160400390625, -0.1068115234375, -0.05322265625, 0.0003662109375, 0.053955078125, 0.1075439453125, 0.1611328125, 0.2147216796875, 0.268310546875, 0.3218994140625, 0.37548828125, 0.4290771484375, 0.482666015625, 0.5362548828125, 0.58984375, 0.6434326171875, 0.697021484375, 0.7506103515625, 0.80419921875, 0.8577880859375, 0.911376953125, 0.9649658203125, 1.0185546875, 1.0721435546875, 1.125732421875, 1.1793212890625, 1.23291015625, 1.2864990234375, 1.340087890625, 1.3936767578125, 1.447265625, 1.5008544921875, 1.554443359375, 1.6080322265625, 1.66162109375, 1.7152099609375, 1.768798828125, 1.8223876953125, 1.8759765625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 2.0, 5.0, 7.0, 5.0, 10.0, 8.0, 6.0, 20.0, 20.0, 22.0, 24.0, 18.0, 31.0, 29.0, 32.0, 45.0, 45.0, 34.0, 49.0, 102.0, 841.0, 206.0, 54.0, 46.0, 28.0, 40.0, 42.0, 38.0, 22.0, 35.0, 23.0, 19.0, 25.0, 14.0, 10.0, 10.0, 16.0, 7.0, 8.0, 12.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.53125, -3.41607666015625, -3.3009033203125, -3.18572998046875, -3.070556640625, -2.95538330078125, -2.8402099609375, -2.72503662109375, -2.60986328125, -2.49468994140625, -2.3795166015625, -2.26434326171875, -2.149169921875, -2.03399658203125, -1.9188232421875, -1.80364990234375, -1.6884765625, -1.57330322265625, -1.4581298828125, -1.34295654296875, -1.227783203125, -1.11260986328125, -0.9974365234375, -0.88226318359375, -0.76708984375, -0.65191650390625, -0.5367431640625, -0.42156982421875, -0.306396484375, -0.19122314453125, -0.0760498046875, 0.03912353515625, 0.154296875, 0.26947021484375, 0.3846435546875, 0.49981689453125, 0.614990234375, 0.73016357421875, 0.8453369140625, 0.96051025390625, 1.07568359375, 1.19085693359375, 1.3060302734375, 1.42120361328125, 1.536376953125, 1.65155029296875, 1.7667236328125, 1.88189697265625, 1.9970703125, 2.11224365234375, 2.2274169921875, 2.34259033203125, 2.457763671875, 2.57293701171875, 2.6881103515625, 2.80328369140625, 2.91845703125, 3.03363037109375, 3.1488037109375, 3.26397705078125, 3.379150390625, 3.49432373046875, 3.6094970703125, 3.72467041015625, 3.83984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 24.0, 36.0, 59.0, 96.0, 140.0, 203.0, 152.0, 80.0, 70.0, 42.0, 25.0, 19.0, 9.0, 2.0, 6.0, 2.0, 3.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.538033485412598, -11.14929485321045, -10.760555267333984, -10.371816635131836, -9.983078002929688, -9.594338417053223, -9.205599784851074, -8.81686019897461, -8.428121566772461, -8.039382934570312, -7.650643348693848, -7.261904716491699, -6.873165607452393, -6.484426498413086, -6.0956878662109375, -5.706948757171631, -5.318209648132324, -4.929470539093018, -4.540731430053711, -4.1519927978515625, -3.763253688812256, -3.374514579772949, -2.9857757091522217, -2.597036838531494, -2.2082977294921875, -1.8195587396621704, -1.4308197498321533, -1.0420807600021362, -0.6533417701721191, -0.26460278034210205, 0.12413620948791504, 0.5128750801086426, 0.9016132354736328, 1.29035222530365, 1.679091215133667, 2.0678300857543945, 2.456569194793701, 2.845308303833008, 3.2340471744537354, 3.622786045074463, 4.0115251541137695, 4.400264263153076, 4.789003372192383, 5.177742004394531, 5.566481113433838, 5.9552202224731445, 6.343958854675293, 6.7326979637146, 7.121437072753906, 7.510176181793213, 7.8989152908325195, 8.287653923034668, 8.676393508911133, 9.065132141113281, 9.45387077331543, 9.842609405517578, 10.231348991394043, 10.620087623596191, 11.008827209472656, 11.397565841674805, 11.786304473876953, 12.175044059753418, 12.563782691955566, 12.952522277832031, 13.34126091003418]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 7.0, 9.0, 7.0, 17.0, 9.0, 15.0, 24.0, 31.0, 23.0, 47.0, 53.0, 67.0, 53.0, 92.0, 94.0, 75.0, 69.0, 60.0, 47.0, 34.0, 35.0, 26.0, 28.0, 15.0, 19.0, 10.0, 4.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.305809020996094, -15.819100379943848, -15.332390785217285, -14.845682144165039, -14.358972549438477, -13.87226390838623, -13.385554313659668, -12.898845672607422, -12.41213607788086, -11.925427436828613, -11.43871784210205, -10.952009201049805, -10.465299606323242, -9.978590965270996, -9.491881370544434, -9.005172729492188, -8.518463134765625, -8.031754493713379, -7.545044898986816, -7.058335781097412, -6.571626663208008, -6.084918022155762, -5.598208427429199, -5.111499786376953, -4.624791145324707, -4.138082027435303, -3.6513729095458984, -3.164663791656494, -2.67795467376709, -2.1912457942962646, -1.7045366764068604, -1.217827558517456, -0.7311182022094727, -0.24440911412239075, 0.24229997396469116, 0.7290090322494507, 1.215718150138855, 1.7024271488189697, 2.189136266708374, 2.6758453845977783, 3.1625545024871826, 3.649263620376587, 4.135972499847412, 4.622681617736816, 5.109390735626221, 5.596099853515625, 6.082808971405029, 6.569518089294434, 7.056227207183838, 7.542936325073242, 8.029644966125488, 8.51635456085205, 9.003063201904297, 9.48977279663086, 9.976481437683105, 10.463191032409668, 10.949899673461914, 11.43660831451416, 11.923317909240723, 12.410026550292969, 12.896736145019531, 13.383444786071777, 13.87015438079834, 14.356863021850586, 14.843572616577148]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 9.0, 17.0, 27.0, 41.0, 66.0, 93.0, 137.0, 250.0, 440.0, 716.0, 1421.0, 2811.0, 6276.0, 16505.0, 58716.0, 3716206.0, 322403.0, 41411.0, 14089.0, 6034.0, 2864.0, 1519.0, 855.0, 500.0, 295.0, 193.0, 131.0, 73.0, 46.0, 44.0, 20.0, 19.0, 13.0, 9.0, 4.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1336669921875, -0.1294708251953125, -0.125274658203125, -0.1210784912109375, -0.11688232421875, -0.1126861572265625, -0.108489990234375, -0.1042938232421875, -0.10009765625, -0.0959014892578125, -0.091705322265625, -0.0875091552734375, -0.08331298828125, -0.0791168212890625, -0.074920654296875, -0.0707244873046875, -0.0665283203125, -0.0623321533203125, -0.058135986328125, -0.0539398193359375, -0.04974365234375, -0.0455474853515625, -0.041351318359375, -0.0371551513671875, -0.032958984375, -0.0287628173828125, -0.024566650390625, -0.0203704833984375, -0.01617431640625, -0.0119781494140625, -0.007781982421875, -0.0035858154296875, 0.0006103515625, 0.0048065185546875, 0.009002685546875, 0.0131988525390625, 0.01739501953125, 0.0215911865234375, 0.025787353515625, 0.0299835205078125, 0.0341796875, 0.0383758544921875, 0.042572021484375, 0.0467681884765625, 0.05096435546875, 0.0551605224609375, 0.059356689453125, 0.0635528564453125, 0.0677490234375, 0.0719451904296875, 0.076141357421875, 0.0803375244140625, 0.08453369140625, 0.0887298583984375, 0.092926025390625, 0.0971221923828125, 0.101318359375, 0.1055145263671875, 0.109710693359375, 0.1139068603515625, 0.11810302734375, 0.1222991943359375, 0.126495361328125, 0.1306915283203125, 0.1348876953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 9.0, 4.0, 2.0, 9.0, 4.0, 6.0, 8.0, 14.0, 11.0, 11.0, 24.0, 49.0, 259.0, 395.0, 55.0, 21.0, 15.0, 21.0, 9.0, 8.0, 10.0, 6.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033050537109375, -0.03179597854614258, -0.030541419982910156, -0.029286861419677734, -0.028032302856445312, -0.02677774429321289, -0.02552318572998047, -0.024268627166748047, -0.023014068603515625, -0.021759510040283203, -0.02050495147705078, -0.01925039291381836, -0.017995834350585938, -0.016741275787353516, -0.015486717224121094, -0.014232158660888672, -0.01297760009765625, -0.011723041534423828, -0.010468482971191406, -0.009213924407958984, -0.007959365844726562, -0.006704807281494141, -0.005450248718261719, -0.004195690155029297, -0.002941131591796875, -0.0016865730285644531, -0.00043201446533203125, 0.0008225440979003906, 0.0020771026611328125, 0.0033316612243652344, 0.004586219787597656, 0.005840778350830078, 0.0070953369140625, 0.008349895477294922, 0.009604454040527344, 0.010859012603759766, 0.012113571166992188, 0.01336812973022461, 0.014622688293457031, 0.015877246856689453, 0.017131805419921875, 0.018386363983154297, 0.01964092254638672, 0.02089548110961914, 0.022150039672851562, 0.023404598236083984, 0.024659156799316406, 0.025913715362548828, 0.02716827392578125, 0.028422832489013672, 0.029677391052246094, 0.030931949615478516, 0.03218650817871094, 0.03344106674194336, 0.03469562530517578, 0.0359501838684082, 0.037204742431640625, 0.03845930099487305, 0.03971385955810547, 0.04096841812133789, 0.04222297668457031, 0.043477535247802734, 0.044732093811035156, 0.04598665237426758, 0.0472412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 11.0, 16.0, 16.0, 16.0, 24.0, 35.0, 46.0, 67.0, 104.0, 159.0, 234.0, 385.0, 743.0, 1473.0, 3436.0, 8370.0, 22526.0, 67283.0, 247533.0, 1545534.0, 1902663.0, 279091.0, 73924.0, 24199.0, 8961.0, 3777.0, 1650.0, 792.0, 424.0, 212.0, 170.0, 93.0, 64.0, 48.0, 48.0, 32.0, 22.0, 16.0, 16.0, 13.0, 10.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.08154296875, -0.07907485961914062, -0.07660675048828125, -0.07413864135742188, -0.0716705322265625, -0.06920242309570312, -0.06673431396484375, -0.06426620483398438, -0.061798095703125, -0.059329986572265625, -0.05686187744140625, -0.054393768310546875, -0.0519256591796875, -0.049457550048828125, -0.04698944091796875, -0.044521331787109375, -0.04205322265625, -0.039585113525390625, -0.03711700439453125, -0.034648895263671875, -0.0321807861328125, -0.029712677001953125, -0.02724456787109375, -0.024776458740234375, -0.022308349609375, -0.019840240478515625, -0.01737213134765625, -0.014904022216796875, -0.0124359130859375, -0.009967803955078125, -0.00749969482421875, -0.005031585693359375, -0.0025634765625, -9.5367431640625e-05, 0.00237274169921875, 0.004840850830078125, 0.0073089599609375, 0.009777069091796875, 0.01224517822265625, 0.014713287353515625, 0.017181396484375, 0.019649505615234375, 0.02211761474609375, 0.024585723876953125, 0.0270538330078125, 0.029521942138671875, 0.03199005126953125, 0.034458160400390625, 0.03692626953125, 0.039394378662109375, 0.04186248779296875, 0.044330596923828125, 0.0467987060546875, 0.049266815185546875, 0.05173492431640625, 0.054203033447265625, 0.056671142578125, 0.059139251708984375, 0.06160736083984375, 0.06407546997070312, 0.0665435791015625, 0.06901168823242188, 0.07147979736328125, 0.07394790649414062, 0.076416015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 5.0, 8.0, 21.0, 16.0, 22.0, 27.0, 33.0, 39.0, 61.0, 79.0, 93.0, 136.0, 187.0, 275.0, 463.0, 824.0, 562.0, 357.0, 214.0, 159.0, 116.0, 78.0, 58.0, 33.0, 34.0, 35.0, 19.0, 21.0, 17.0, 13.0, 6.0, 9.0, 7.0, 7.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029388427734375, -0.028324604034423828, -0.027260780334472656, -0.026196956634521484, -0.025133132934570312, -0.02406930923461914, -0.02300548553466797, -0.021941661834716797, -0.020877838134765625, -0.019814014434814453, -0.01875019073486328, -0.01768636703491211, -0.016622543334960938, -0.015558719635009766, -0.014494895935058594, -0.013431072235107422, -0.01236724853515625, -0.011303424835205078, -0.010239601135253906, -0.009175777435302734, -0.008111953735351562, -0.007048130035400391, -0.005984306335449219, -0.004920482635498047, -0.003856658935546875, -0.002792835235595703, -0.0017290115356445312, -0.0006651878356933594, 0.0003986358642578125, 0.0014624595642089844, 0.0025262832641601562, 0.003590106964111328, 0.0046539306640625, 0.005717754364013672, 0.006781578063964844, 0.007845401763916016, 0.008909225463867188, 0.00997304916381836, 0.011036872863769531, 0.012100696563720703, 0.013164520263671875, 0.014228343963623047, 0.015292167663574219, 0.01635599136352539, 0.017419815063476562, 0.018483638763427734, 0.019547462463378906, 0.020611286163330078, 0.02167510986328125, 0.022738933563232422, 0.023802757263183594, 0.024866580963134766, 0.025930404663085938, 0.02699422836303711, 0.02805805206298828, 0.029121875762939453, 0.030185699462890625, 0.031249523162841797, 0.03231334686279297, 0.03337717056274414, 0.03444099426269531, 0.035504817962646484, 0.036568641662597656, 0.03763246536254883, 0.0386962890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 11.0, 46.0, 108.0, 195.0, 225.0, 197.0, 111.0, 66.0, 26.0, 6.0, 1.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.389734148979187, -0.3784733712673187, -0.36721259355545044, -0.35595181584358215, -0.34469103813171387, -0.3334302604198456, -0.3221694827079773, -0.3109087347984314, -0.2996479272842407, -0.28838714957237244, -0.27712637186050415, -0.26586559414863586, -0.2546048164367676, -0.2433440387248993, -0.2320832759141922, -0.2208224982023239, -0.20956173539161682, -0.19830095767974854, -0.18704017996788025, -0.17577940225601196, -0.16451862454414368, -0.1532578468322754, -0.1419970840215683, -0.1307363063097, -0.11947552859783173, -0.10821475088596344, -0.09695397317409515, -0.08569320291280746, -0.07443242520093918, -0.06317164748907089, -0.0519108772277832, -0.04065009951591492, -0.02938932180404663, -0.018128545954823494, -0.006867770105600357, 0.004393003880977631, 0.015653781592845917, 0.026914559304714203, 0.03817532956600189, 0.04943610727787018, 0.060696884989738464, 0.07195766270160675, 0.08321844041347504, 0.09447921067476273, 0.10573998838663101, 0.1170007660984993, 0.128261536359787, 0.13952231407165527, 0.15078309178352356, 0.16204386949539185, 0.17330464720726013, 0.18456542491912842, 0.1958262026309967, 0.207086980342865, 0.21834774315357208, 0.22960852086544037, 0.24086929857730865, 0.25213006138801575, 0.26339083909988403, 0.2746516168117523, 0.2859123945236206, 0.2971731722354889, 0.3084339499473572, 0.31969472765922546, 0.33095550537109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 14.0, 15.0, 33.0, 28.0, 34.0, 48.0, 59.0, 63.0, 72.0, 62.0, 74.0, 72.0, 64.0, 65.0, 53.0, 63.0, 45.0, 32.0, 24.0, 20.0, 16.0, 11.0, 5.0, 2.0, 6.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3145880699157715, -0.30716803669929504, -0.2997480034828186, -0.29232797026634216, -0.2849079370498657, -0.27748793363571167, -0.27006787061691284, -0.2626478672027588, -0.25522783398628235, -0.2478078007698059, -0.24038776755332947, -0.23296773433685303, -0.22554771602153778, -0.21812768280506134, -0.2107076495885849, -0.20328761637210846, -0.19586758315563202, -0.18844754993915558, -0.18102751672267914, -0.1736074984073639, -0.16618746519088745, -0.158767431974411, -0.15134739875793457, -0.14392736554145813, -0.1365073323249817, -0.12908729910850525, -0.1216672733426094, -0.11424724012613297, -0.10682721436023712, -0.09940718114376068, -0.09198714792728424, -0.0845671147108078, -0.07714709639549255, -0.06972706317901611, -0.06230703741312027, -0.05488700419664383, -0.04746697470545769, -0.040046945214271545, -0.032626911997795105, -0.025206882506608963, -0.01778685301542282, -0.010366822592914104, -0.002946792170405388, 0.004473239183425903, 0.011893268674612045, 0.019313298165798187, 0.026733331382274628, 0.03415336087346077, 0.04157339036464691, 0.048993419855833054, 0.056413449347019196, 0.06383348256349564, 0.07125350832939148, 0.07867354154586792, 0.08609357476234436, 0.0935136079788208, 0.10093363374471664, 0.10835366696119308, 0.11577369272708893, 0.12319372594356537, 0.1306137591600418, 0.13803377747535706, 0.1454538106918335, 0.15287384390830994, 0.16029387712478638]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 7.0, 12.0, 17.0, 37.0, 46.0, 79.0, 110.0, 149.0, 248.0, 383.0, 552.0, 896.0, 1377.0, 2228.0, 3383.0, 5525.0, 9189.0, 16837.0, 32272.0, 117419.0, 741384.0, 57861.0, 24729.0, 13490.0, 7766.0, 4559.0, 2776.0, 1800.0, 1183.0, 770.0, 465.0, 358.0, 226.0, 145.0, 87.0, 59.0, 34.0, 21.0, 21.0, 16.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1070556640625, -0.1036367416381836, -0.10021781921386719, -0.09679889678955078, -0.09337997436523438, -0.08996105194091797, -0.08654212951660156, -0.08312320709228516, -0.07970428466796875, -0.07628536224365234, -0.07286643981933594, -0.06944751739501953, -0.06602859497070312, -0.06260967254638672, -0.05919075012207031, -0.055771827697753906, -0.0523529052734375, -0.048933982849121094, -0.04551506042480469, -0.04209613800048828, -0.038677215576171875, -0.03525829315185547, -0.03183937072753906, -0.028420448303222656, -0.02500152587890625, -0.021582603454589844, -0.018163681030273438, -0.014744758605957031, -0.011325836181640625, -0.007906913757324219, -0.0044879913330078125, -0.0010690689086914062, 0.002349853515625, 0.005768775939941406, 0.009187698364257812, 0.012606620788574219, 0.016025543212890625, 0.01944446563720703, 0.022863388061523438, 0.026282310485839844, 0.02970123291015625, 0.033120155334472656, 0.03653907775878906, 0.03995800018310547, 0.043376922607421875, 0.04679584503173828, 0.05021476745605469, 0.053633689880371094, 0.0570526123046875, 0.060471534729003906, 0.06389045715332031, 0.06730937957763672, 0.07072830200195312, 0.07414722442626953, 0.07756614685058594, 0.08098506927490234, 0.08440399169921875, 0.08782291412353516, 0.09124183654785156, 0.09466075897216797, 0.09807968139648438, 0.10149860382080078, 0.10491752624511719, 0.1083364486694336, 0.11175537109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 10.0, 3.0, 10.0, 7.0, 10.0, 13.0, 10.0, 10.0, 35.0, 115.0, 426.0, 174.0, 43.0, 23.0, 15.0, 17.0, 12.0, 9.0, 5.0, 5.0, 6.0, 6.0, 2.0, 6.0, 5.0, 1.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035400390625, -0.03408527374267578, -0.03277015686035156, -0.031455039978027344, -0.030139923095703125, -0.028824806213378906, -0.027509689331054688, -0.02619457244873047, -0.02487945556640625, -0.02356433868408203, -0.022249221801757812, -0.020934104919433594, -0.019618988037109375, -0.018303871154785156, -0.016988754272460938, -0.01567363739013672, -0.0143585205078125, -0.013043403625488281, -0.011728286743164062, -0.010413169860839844, -0.009098052978515625, -0.007782936096191406, -0.0064678192138671875, -0.005152702331542969, -0.00383758544921875, -0.0025224685668945312, -0.0012073516845703125, 0.00010776519775390625, 0.001422882080078125, 0.0027379989624023438, 0.0040531158447265625, 0.005368232727050781, 0.006683349609375, 0.007998466491699219, 0.009313583374023438, 0.010628700256347656, 0.011943817138671875, 0.013258934020996094, 0.014574050903320312, 0.01588916778564453, 0.01720428466796875, 0.01851940155029297, 0.019834518432617188, 0.021149635314941406, 0.022464752197265625, 0.023779869079589844, 0.025094985961914062, 0.02641010284423828, 0.0277252197265625, 0.02904033660888672, 0.030355453491210938, 0.031670570373535156, 0.032985687255859375, 0.034300804138183594, 0.03561592102050781, 0.03693103790283203, 0.03824615478515625, 0.03956127166748047, 0.04087638854980469, 0.042191505432128906, 0.043506622314453125, 0.044821739196777344, 0.04613685607910156, 0.04745197296142578, 0.04876708984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 10.0, 5.0, 12.0, 17.0, 16.0, 28.0, 27.0, 38.0, 58.0, 73.0, 124.0, 202.0, 360.0, 633.0, 1452.0, 3814.0, 12583.0, 51948.0, 282682.0, 537612.0, 120622.0, 25175.0, 6756.0, 2179.0, 889.0, 431.0, 295.0, 163.0, 96.0, 75.0, 59.0, 36.0, 21.0, 18.0, 20.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12451171875, -0.12076759338378906, -0.11702346801757812, -0.11327934265136719, -0.10953521728515625, -0.10579109191894531, -0.10204696655273438, -0.09830284118652344, -0.0945587158203125, -0.09081459045410156, -0.08707046508789062, -0.08332633972167969, -0.07958221435546875, -0.07583808898925781, -0.07209396362304688, -0.06834983825683594, -0.064605712890625, -0.06086158752441406, -0.057117462158203125, -0.05337333679199219, -0.04962921142578125, -0.04588508605957031, -0.042140960693359375, -0.03839683532714844, -0.0346527099609375, -0.030908584594726562, -0.027164459228515625, -0.023420333862304688, -0.01967620849609375, -0.015932083129882812, -0.012187957763671875, -0.008443832397460938, -0.00469970703125, -0.0009555816650390625, 0.002788543701171875, 0.0065326690673828125, 0.01027679443359375, 0.014020919799804688, 0.017765045166015625, 0.021509170532226562, 0.0252532958984375, 0.028997421264648438, 0.032741546630859375, 0.03648567199707031, 0.04022979736328125, 0.04397392272949219, 0.047718048095703125, 0.05146217346191406, 0.055206298828125, 0.05895042419433594, 0.06269454956054688, 0.06643867492675781, 0.07018280029296875, 0.07392692565917969, 0.07767105102539062, 0.08141517639160156, 0.0851593017578125, 0.08890342712402344, 0.09264755249023438, 0.09639167785644531, 0.10013580322265625, 0.10387992858886719, 0.10762405395507812, 0.11136817932128906, 0.1151123046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 6.0, 16.0, 11.0, 14.0, 5.0, 21.0, 16.0, 26.0, 26.0, 42.0, 45.0, 42.0, 40.0, 38.0, 41.0, 56.0, 42.0, 50.0, 42.0, 49.0, 55.0, 34.0, 43.0, 36.0, 46.0, 30.0, 24.0, 27.0, 17.0, 11.0, 8.0, 12.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.1600475311279297, -0.15517807006835938, -0.15030860900878906, -0.14543914794921875, -0.14056968688964844, -0.13570022583007812, -0.1308307647705078, -0.1259613037109375, -0.12109184265136719, -0.11622238159179688, -0.11135292053222656, -0.10648345947265625, -0.10161399841308594, -0.09674453735351562, -0.09187507629394531, -0.087005615234375, -0.08213615417480469, -0.07726669311523438, -0.07239723205566406, -0.06752777099609375, -0.06265830993652344, -0.057788848876953125, -0.05291938781738281, -0.0480499267578125, -0.04318046569824219, -0.038311004638671875, -0.03344154357910156, -0.02857208251953125, -0.023702621459960938, -0.018833160400390625, -0.013963699340820312, -0.00909423828125, -0.0042247772216796875, 0.000644683837890625, 0.0055141448974609375, 0.01038360595703125, 0.015253067016601562, 0.020122528076171875, 0.024991989135742188, 0.0298614501953125, 0.03473091125488281, 0.039600372314453125, 0.04446983337402344, 0.04933929443359375, 0.05420875549316406, 0.059078216552734375, 0.06394767761230469, 0.068817138671875, 0.07368659973144531, 0.07855606079101562, 0.08342552185058594, 0.08829498291015625, 0.09316444396972656, 0.09803390502929688, 0.10290336608886719, 0.1077728271484375, 0.11264228820800781, 0.11751174926757812, 0.12238121032714844, 0.12725067138671875, 0.13212013244628906, 0.13698959350585938, 0.1418590545654297, 0.146728515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 10.0, 15.0, 18.0, 19.0, 29.0, 37.0, 70.0, 100.0, 190.0, 310.0, 569.0, 1081.0, 2306.0, 6047.0, 20664.0, 132259.0, 711004.0, 141330.0, 21619.0, 6087.0, 2320.0, 1069.0, 553.0, 295.0, 196.0, 115.0, 65.0, 55.0, 37.0, 19.0, 13.0, 12.0, 10.0, 12.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.09745311737060547, -0.09425926208496094, -0.0910654067993164, -0.08787155151367188, -0.08467769622802734, -0.08148384094238281, -0.07828998565673828, -0.07509613037109375, -0.07190227508544922, -0.06870841979980469, -0.06551456451416016, -0.062320709228515625, -0.059126853942871094, -0.05593299865722656, -0.05273914337158203, -0.0495452880859375, -0.04635143280029297, -0.04315757751464844, -0.039963722229003906, -0.036769866943359375, -0.033576011657714844, -0.030382156372070312, -0.02718830108642578, -0.02399444580078125, -0.02080059051513672, -0.017606735229492188, -0.014412879943847656, -0.011219024658203125, -0.008025169372558594, -0.0048313140869140625, -0.0016374588012695312, 0.001556396484375, 0.004750251770019531, 0.007944107055664062, 0.011137962341308594, 0.014331817626953125, 0.017525672912597656, 0.020719528198242188, 0.02391338348388672, 0.02710723876953125, 0.03030109405517578, 0.03349494934082031, 0.036688804626464844, 0.039882659912109375, 0.043076515197753906, 0.04627037048339844, 0.04946422576904297, 0.0526580810546875, 0.05585193634033203, 0.05904579162597656, 0.062239646911621094, 0.06543350219726562, 0.06862735748291016, 0.07182121276855469, 0.07501506805419922, 0.07820892333984375, 0.08140277862548828, 0.08459663391113281, 0.08779048919677734, 0.09098434448242188, 0.0941781997680664, 0.09737205505371094, 0.10056591033935547, 0.103759765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 14.0, 14.0, 19.0, 30.0, 25.0, 42.0, 49.0, 61.0, 85.0, 76.0, 113.0, 88.0, 73.0, 60.0, 50.0, 38.0, 40.0, 27.0, 24.0, 17.0, 6.0, 14.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.937980651855469e-05, -6.725545972585678e-05, -6.513111293315887e-05, -6.300676614046097e-05, -6.088241934776306e-05, -5.8758072555065155e-05, -5.663372576236725e-05, -5.450937896966934e-05, -5.2385032176971436e-05, -5.026068538427353e-05, -4.813633859157562e-05, -4.6011991798877716e-05, -4.388764500617981e-05, -4.17632982134819e-05, -3.9638951420783997e-05, -3.751460462808609e-05, -3.5390257835388184e-05, -3.326591104269028e-05, -3.114156424999237e-05, -2.9017217457294464e-05, -2.6892870664596558e-05, -2.476852387189865e-05, -2.2644177079200745e-05, -2.0519830286502838e-05, -1.839548349380493e-05, -1.6271136701107025e-05, -1.4146789908409119e-05, -1.2022443115711212e-05, -9.898096323013306e-06, -7.7737495303154e-06, -5.649402737617493e-06, -3.525055944919586e-06, -1.4007091522216797e-06, 7.236376404762268e-07, 2.8479844331741333e-06, 4.97233122587204e-06, 7.096678018569946e-06, 9.221024811267853e-06, 1.134537160396576e-05, 1.3469718396663666e-05, 1.5594065189361572e-05, 1.771841198205948e-05, 1.9842758774757385e-05, 2.1967105567455292e-05, 2.4091452360153198e-05, 2.6215799152851105e-05, 2.834014594554901e-05, 3.0464492738246918e-05, 3.2588839530944824e-05, 3.471318632364273e-05, 3.683753311634064e-05, 3.8961879909038544e-05, 4.108622670173645e-05, 4.321057349443436e-05, 4.533492028713226e-05, 4.745926707983017e-05, 4.9583613872528076e-05, 5.170796066522598e-05, 5.383230745792389e-05, 5.5956654250621796e-05, 5.80810010433197e-05, 6.020534783601761e-05, 6.232969462871552e-05, 6.445404142141342e-05, 6.657838821411133e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 17.0, 28.0, 42.0, 46.0, 70.0, 127.0, 227.0, 369.0, 666.0, 1467.0, 3345.0, 9386.0, 34111.0, 201537.0, 608187.0, 147780.0, 27437.0, 8088.0, 2860.0, 1235.0, 667.0, 341.0, 189.0, 106.0, 66.0, 39.0, 32.0, 17.0, 11.0, 7.0, 10.0, 7.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.09096717834472656, -0.08824539184570312, -0.08552360534667969, -0.08280181884765625, -0.08008003234863281, -0.07735824584960938, -0.07463645935058594, -0.0719146728515625, -0.06919288635253906, -0.06647109985351562, -0.06374931335449219, -0.06102752685546875, -0.05830574035644531, -0.055583953857421875, -0.05286216735839844, -0.050140380859375, -0.04741859436035156, -0.044696807861328125, -0.04197502136230469, -0.03925323486328125, -0.03653144836425781, -0.033809661865234375, -0.031087875366210938, -0.0283660888671875, -0.025644302368164062, -0.022922515869140625, -0.020200729370117188, -0.01747894287109375, -0.014757156372070312, -0.012035369873046875, -0.009313583374023438, -0.006591796875, -0.0038700103759765625, -0.001148223876953125, 0.0015735626220703125, 0.00429534912109375, 0.0070171356201171875, 0.009738922119140625, 0.012460708618164062, 0.0151824951171875, 0.017904281616210938, 0.020626068115234375, 0.023347854614257812, 0.02606964111328125, 0.028791427612304688, 0.031513214111328125, 0.03423500061035156, 0.036956787109375, 0.03967857360839844, 0.042400360107421875, 0.04512214660644531, 0.04784393310546875, 0.05056571960449219, 0.053287506103515625, 0.05600929260253906, 0.0587310791015625, 0.06145286560058594, 0.06417465209960938, 0.06689643859863281, 0.06961822509765625, 0.07234001159667969, 0.07506179809570312, 0.07778358459472656, 0.08050537109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 9.0, 12.0, 13.0, 32.0, 34.0, 46.0, 60.0, 88.0, 103.0, 108.0, 99.0, 96.0, 71.0, 59.0, 51.0, 20.0, 17.0, 21.0, 17.0, 8.0, 6.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09527587890625, -0.0922842025756836, -0.08929252624511719, -0.08630084991455078, -0.08330917358398438, -0.08031749725341797, -0.07732582092285156, -0.07433414459228516, -0.07134246826171875, -0.06835079193115234, -0.06535911560058594, -0.06236743927001953, -0.059375762939453125, -0.05638408660888672, -0.05339241027832031, -0.050400733947753906, -0.0474090576171875, -0.044417381286621094, -0.04142570495605469, -0.03843402862548828, -0.035442352294921875, -0.03245067596435547, -0.029458999633789062, -0.026467323303222656, -0.02347564697265625, -0.020483970642089844, -0.017492294311523438, -0.014500617980957031, -0.011508941650390625, -0.008517265319824219, -0.0055255889892578125, -0.0025339126586914062, 0.000457763671875, 0.0034494400024414062, 0.0064411163330078125, 0.009432792663574219, 0.012424468994140625, 0.015416145324707031, 0.018407821655273438, 0.021399497985839844, 0.02439117431640625, 0.027382850646972656, 0.030374526977539062, 0.03336620330810547, 0.036357879638671875, 0.03934955596923828, 0.04234123229980469, 0.045332908630371094, 0.0483245849609375, 0.051316261291503906, 0.05430793762207031, 0.05729961395263672, 0.060291290283203125, 0.06328296661376953, 0.06627464294433594, 0.06926631927490234, 0.07225799560546875, 0.07524967193603516, 0.07824134826660156, 0.08123302459716797, 0.08422470092773438, 0.08721637725830078, 0.09020805358886719, 0.0931997299194336, 0.09619140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 18.0, 39.0, 155.0, 423.0, 247.0, 74.0, 27.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6697742938995361, -1.6020219326019287, -1.5342695713043213, -1.4665172100067139, -1.3987648487091064, -1.331012487411499, -1.2632602453231812, -1.1955078840255737, -1.1277555227279663, -1.0600031614303589, -0.9922508001327515, -0.9244984984397888, -0.8567461371421814, -0.788993775844574, -0.7212414741516113, -0.6534891128540039, -0.5857367515563965, -0.5179843902587891, -0.45023205876350403, -0.382479727268219, -0.3147273659706116, -0.24697500467300415, -0.17922267317771912, -0.11147034168243408, -0.04371798038482666, 0.024034366011619568, 0.0917867124080658, 0.15953905880451202, 0.22729140520095825, 0.2950437664985657, 0.3627960979938507, 0.43054842948913574, 0.49830102920532227, 0.5660533905029297, 0.6338057518005371, 0.7015580534934998, 0.7693104147911072, 0.8370627760887146, 0.9048150777816772, 0.9725674390792847, 1.040319800376892, 1.1080721616744995, 1.175824522972107, 1.2435768842697144, 1.3113291263580322, 1.3790814876556396, 1.446833848953247, 1.5145862102508545, 1.582338571548462, 1.6500909328460693, 1.7178432941436768, 1.7855956554412842, 1.8533480167388916, 1.921100378036499, 1.988852620124817, 2.0566048622131348, 2.124357223510742, 2.1921095848083496, 2.259861946105957, 2.3276143074035645, 2.395366668701172, 2.4631190299987793, 2.5308713912963867, 2.598623752593994, 2.6663761138916016]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 20.0, 17.0, 36.0, 77.0, 102.0, 149.0, 172.0, 124.0, 95.0, 48.0, 32.0, 18.0, 11.0, 8.0, 5.0, 2.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.358370304107666, -2.277796745300293, -2.197222948074341, -2.1166493892669678, -2.0360758304595947, -1.9555021524429321, -1.8749284744262695, -1.7943549156188965, -1.7137812376022339, -1.6332075595855713, -1.5526340007781982, -1.4720603227615356, -1.391486644744873, -1.3109130859375, -1.2303394079208374, -1.1497657299041748, -1.0691921710968018, -0.9886185526847839, -0.9080449342727661, -0.8274712562561035, -0.7468976378440857, -0.6663240194320679, -0.5857503414154053, -0.5051767230033875, -0.42460310459136963, -0.3440294861793518, -0.2634558379650116, -0.18288220465183258, -0.10230857133865356, -0.021734952926635742, 0.05883869528770447, 0.13941234350204468, 0.2199862003326416, 0.3005598187446594, 0.38113346695899963, 0.46170711517333984, 0.5422807335853577, 0.6228543519973755, 0.7034280300140381, 0.7840016484260559, 0.8645752668380737, 0.9451488852500916, 1.0257225036621094, 1.106296181678772, 1.1868698596954346, 1.2674434185028076, 1.3480170965194702, 1.4285907745361328, 1.5091643333435059, 1.5897380113601685, 1.6703115701675415, 1.750885248184204, 1.8314588069915771, 1.9120324850082397, 1.9926061630249023, 2.0731797218322754, 2.1537532806396484, 2.2343268394470215, 2.3149006366729736, 2.3954741954803467, 2.4760477542877197, 2.556621551513672, 2.637195110321045, 2.717768669128418, 2.79834246635437]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 15.0, 23.0, 40.0, 59.0, 108.0, 175.0, 274.0, 552.0, 1007.0, 1830.0, 3658.0, 8121.0, 22266.0, 103346.0, 3837715.0, 162614.0, 30421.0, 10963.0, 4888.0, 2523.0, 1414.0, 793.0, 485.0, 303.0, 215.0, 150.0, 96.0, 71.0, 40.0, 34.0, 20.0, 15.0, 15.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2498779296875, -0.23972129821777344, -0.22956466674804688, -0.2194080352783203, -0.20925140380859375, -0.1990947723388672, -0.18893814086914062, -0.17878150939941406, -0.1686248779296875, -0.15846824645996094, -0.14831161499023438, -0.1381549835205078, -0.12799835205078125, -0.11784172058105469, -0.10768508911132812, -0.09752845764160156, -0.087371826171875, -0.07721519470214844, -0.06705856323242188, -0.05690193176269531, -0.04674530029296875, -0.03658866882324219, -0.026432037353515625, -0.016275405883789062, -0.0061187744140625, 0.0040378570556640625, 0.014194488525390625, 0.024351119995117188, 0.03450775146484375, 0.04466438293457031, 0.054821014404296875, 0.06497764587402344, 0.07513427734375, 0.08529090881347656, 0.09544754028320312, 0.10560417175292969, 0.11576080322265625, 0.1259174346923828, 0.13607406616210938, 0.14623069763183594, 0.1563873291015625, 0.16654396057128906, 0.17670059204101562, 0.1868572235107422, 0.19701385498046875, 0.2071704864501953, 0.21732711791992188, 0.22748374938964844, 0.237640380859375, 0.24779701232910156, 0.2579536437988281, 0.2681102752685547, 0.27826690673828125, 0.2884235382080078, 0.2985801696777344, 0.30873680114746094, 0.3188934326171875, 0.32905006408691406, 0.3392066955566406, 0.3493633270263672, 0.35951995849609375, 0.3696765899658203, 0.3798332214355469, 0.38998985290527344, 0.400146484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 12.0, 11.0, 3.0, 7.0, 5.0, 11.0, 15.0, 23.0, 43.0, 106.0, 249.0, 243.0, 86.0, 50.0, 28.0, 13.0, 16.0, 8.0, 12.0, 4.0, 5.0, 9.0, 8.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0264129638671875, -0.02527642250061035, -0.024139881134033203, -0.023003339767456055, -0.021866798400878906, -0.020730257034301758, -0.01959371566772461, -0.01845717430114746, -0.017320632934570312, -0.016184091567993164, -0.015047550201416016, -0.013911008834838867, -0.012774467468261719, -0.01163792610168457, -0.010501384735107422, -0.009364843368530273, -0.008228302001953125, -0.0070917606353759766, -0.005955219268798828, -0.00481867790222168, -0.0036821365356445312, -0.002545595169067383, -0.0014090538024902344, -0.00027251243591308594, 0.0008640289306640625, 0.002000570297241211, 0.0031371116638183594, 0.004273653030395508, 0.005410194396972656, 0.006546735763549805, 0.007683277130126953, 0.008819818496704102, 0.00995635986328125, 0.011092901229858398, 0.012229442596435547, 0.013365983963012695, 0.014502525329589844, 0.015639066696166992, 0.01677560806274414, 0.01791214942932129, 0.019048690795898438, 0.020185232162475586, 0.021321773529052734, 0.022458314895629883, 0.02359485626220703, 0.02473139762878418, 0.025867938995361328, 0.027004480361938477, 0.028141021728515625, 0.029277563095092773, 0.030414104461669922, 0.03155064582824707, 0.03268718719482422, 0.03382372856140137, 0.034960269927978516, 0.036096811294555664, 0.03723335266113281, 0.03836989402770996, 0.03950643539428711, 0.04064297676086426, 0.041779518127441406, 0.042916059494018555, 0.0440526008605957, 0.04518914222717285, 0.04632568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 8.0, 7.0, 10.0, 18.0, 18.0, 20.0, 32.0, 74.0, 117.0, 229.0, 495.0, 988.0, 2463.0, 6997.0, 26518.0, 146049.0, 2768118.0, 1119661.0, 94178.0, 19174.0, 5437.0, 1876.0, 876.0, 354.0, 238.0, 118.0, 64.0, 56.0, 25.0, 19.0, 11.0, 5.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2570629119873047, -0.24947738647460938, -0.24189186096191406, -0.23430633544921875, -0.22672080993652344, -0.21913528442382812, -0.2115497589111328, -0.2039642333984375, -0.1963787078857422, -0.18879318237304688, -0.18120765686035156, -0.17362213134765625, -0.16603660583496094, -0.15845108032226562, -0.1508655548095703, -0.143280029296875, -0.1356945037841797, -0.12810897827148438, -0.12052345275878906, -0.11293792724609375, -0.10535240173339844, -0.09776687622070312, -0.09018135070800781, -0.0825958251953125, -0.07501029968261719, -0.06742477416992188, -0.05983924865722656, -0.05225372314453125, -0.04466819763183594, -0.037082672119140625, -0.029497146606445312, -0.02191162109375, -0.014326095581054688, -0.006740570068359375, 0.0008449554443359375, 0.00843048095703125, 0.016016006469726562, 0.023601531982421875, 0.031187057495117188, 0.0387725830078125, 0.04635810852050781, 0.053943634033203125, 0.06152915954589844, 0.06911468505859375, 0.07670021057128906, 0.08428573608398438, 0.09187126159667969, 0.099456787109375, 0.10704231262207031, 0.11462783813476562, 0.12221336364746094, 0.12979888916015625, 0.13738441467285156, 0.14496994018554688, 0.1525554656982422, 0.1601409912109375, 0.1677265167236328, 0.17531204223632812, 0.18289756774902344, 0.19048309326171875, 0.19806861877441406, 0.20565414428710938, 0.2132396697998047, 0.2208251953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 11.0, 10.0, 17.0, 27.0, 35.0, 43.0, 56.0, 111.0, 180.0, 294.0, 620.0, 1366.0, 541.0, 271.0, 153.0, 103.0, 63.0, 42.0, 34.0, 17.0, 12.0, 17.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.036038875579833984, -0.03472423553466797, -0.03340959548950195, -0.03209495544433594, -0.030780315399169922, -0.029465675354003906, -0.02815103530883789, -0.026836395263671875, -0.02552175521850586, -0.024207115173339844, -0.022892475128173828, -0.021577835083007812, -0.020263195037841797, -0.01894855499267578, -0.017633914947509766, -0.01631927490234375, -0.015004634857177734, -0.013689994812011719, -0.012375354766845703, -0.011060714721679688, -0.009746074676513672, -0.008431434631347656, -0.007116794586181641, -0.005802154541015625, -0.004487514495849609, -0.0031728744506835938, -0.0018582344055175781, -0.0005435943603515625, 0.0007710456848144531, 0.0020856857299804688, 0.0034003257751464844, 0.0047149658203125, 0.006029605865478516, 0.007344245910644531, 0.008658885955810547, 0.009973526000976562, 0.011288166046142578, 0.012602806091308594, 0.01391744613647461, 0.015232086181640625, 0.01654672622680664, 0.017861366271972656, 0.019176006317138672, 0.020490646362304688, 0.021805286407470703, 0.02311992645263672, 0.024434566497802734, 0.02574920654296875, 0.027063846588134766, 0.02837848663330078, 0.029693126678466797, 0.031007766723632812, 0.03232240676879883, 0.033637046813964844, 0.03495168685913086, 0.036266326904296875, 0.03758096694946289, 0.038895606994628906, 0.04021024703979492, 0.04152488708496094, 0.04283952713012695, 0.04415416717529297, 0.045468807220458984, 0.046783447265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 28.0, 99.0, 261.0, 338.0, 181.0, 59.0, 14.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20842024683952332, -0.19268736243247986, -0.1769544780254364, -0.16122160851955414, -0.14548872411251068, -0.12975583970546722, -0.11402296274900436, -0.0982900857925415, -0.08255720138549805, -0.06682431697845459, -0.05109144002199173, -0.03535855934023857, -0.019625678658485413, -0.0038927942514419556, 0.011840082705020905, 0.027572959661483765, 0.04330584406852722, 0.05903872475028038, 0.07477160543203354, 0.0905044823884964, 0.10623736679553986, 0.12197025120258331, 0.13770312070846558, 0.15343600511550903, 0.1691688895225525, 0.18490177392959595, 0.2006346583366394, 0.21636752784252167, 0.23210041224956512, 0.24783329665660858, 0.26356616616249084, 0.2792990505695343, 0.29503196477890015, 0.3107648491859436, 0.32649773359298706, 0.3422306180000305, 0.357963502407074, 0.37369638681411743, 0.3894292414188385, 0.40516212582588196, 0.4208950102329254, 0.43662789463996887, 0.45236077904701233, 0.4680936634540558, 0.48382651805877686, 0.4995594024658203, 0.5152922868728638, 0.5310251712799072, 0.5467580556869507, 0.5624909400939941, 0.5782238245010376, 0.593956708908081, 0.6096895933151245, 0.625422477722168, 0.6411553621292114, 0.6568882465362549, 0.6726211309432983, 0.6883540153503418, 0.7040868997573853, 0.7198197841644287, 0.7355526685714722, 0.7512855529785156, 0.7670184373855591, 0.7827513217926025, 0.7984841465950012]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 12.0, 8.0, 5.0, 8.0, 13.0, 13.0, 19.0, 28.0, 27.0, 34.0, 37.0, 59.0, 79.0, 59.0, 67.0, 68.0, 51.0, 62.0, 58.0, 49.0, 50.0, 41.0, 25.0, 22.0, 17.0, 17.0, 16.0, 12.0, 5.0, 2.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1761237382888794, -0.17084665596485138, -0.16556957364082336, -0.16029249131679535, -0.15501540899276733, -0.1497383415699005, -0.1444612592458725, -0.13918417692184448, -0.13390709459781647, -0.12863001227378845, -0.12335292994976044, -0.11807585507631302, -0.112798772752285, -0.10752169042825699, -0.10224461555480957, -0.09696753323078156, -0.09169045090675354, -0.08641336858272552, -0.08113628625869751, -0.07585921138525009, -0.07058212906122208, -0.06530504673719406, -0.060027968138456345, -0.05475088953971863, -0.04947380721569061, -0.0441967248916626, -0.03891964629292488, -0.033642567694187164, -0.02836548537015915, -0.023088404908776283, -0.017811324447393417, -0.0125342458486557, -0.0072571635246276855, -0.0019800830632448196, 0.0032969973981380463, 0.008574077859520912, 0.013851158320903778, 0.019128238782286644, 0.02440531924366951, 0.029682397842407227, 0.03495948016643524, 0.04023656249046326, 0.045513641089200974, 0.05079071968793869, 0.056067802011966705, 0.06134488433599472, 0.06662195920944214, 0.07189904153347015, 0.07717612385749817, 0.08245320618152618, 0.0877302885055542, 0.09300736337900162, 0.09828444570302963, 0.10356152802705765, 0.10883860290050507, 0.11411568522453308, 0.1193927675485611, 0.12466984987258911, 0.12994693219661713, 0.13522401452064514, 0.14050108194351196, 0.14577816426753998, 0.151055246591568, 0.156332328915596, 0.16160941123962402]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 14.0, 16.0, 8.0, 31.0, 41.0, 55.0, 73.0, 147.0, 199.0, 315.0, 463.0, 843.0, 1517.0, 2878.0, 5723.0, 12987.0, 33880.0, 184311.0, 691728.0, 72686.0, 22046.0, 9374.0, 4240.0, 2189.0, 1098.0, 659.0, 379.0, 214.0, 150.0, 78.0, 79.0, 39.0, 30.0, 16.0, 17.0, 10.0, 11.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.2031269073486328, -0.19702529907226562, -0.19092369079589844, -0.18482208251953125, -0.17872047424316406, -0.17261886596679688, -0.1665172576904297, -0.1604156494140625, -0.1543140411376953, -0.14821243286132812, -0.14211082458496094, -0.13600921630859375, -0.12990760803222656, -0.12380599975585938, -0.11770439147949219, -0.111602783203125, -0.10550117492675781, -0.09939956665039062, -0.09329795837402344, -0.08719635009765625, -0.08109474182128906, -0.07499313354492188, -0.06889152526855469, -0.0627899169921875, -0.05668830871582031, -0.050586700439453125, -0.04448509216308594, -0.03838348388671875, -0.03228187561035156, -0.026180267333984375, -0.020078659057617188, -0.01397705078125, -0.007875442504882812, -0.001773834228515625, 0.0043277740478515625, 0.01042938232421875, 0.016530990600585938, 0.022632598876953125, 0.028734207153320312, 0.0348358154296875, 0.04093742370605469, 0.047039031982421875, 0.05314064025878906, 0.05924224853515625, 0.06534385681152344, 0.07144546508789062, 0.07754707336425781, 0.083648681640625, 0.08975028991699219, 0.09585189819335938, 0.10195350646972656, 0.10805511474609375, 0.11415672302246094, 0.12025833129882812, 0.1263599395751953, 0.1324615478515625, 0.1385631561279297, 0.14466476440429688, 0.15076637268066406, 0.15686798095703125, 0.16296958923339844, 0.16907119750976562, 0.1751728057861328, 0.1812744140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 1.0, 11.0, 3.0, 6.0, 6.0, 11.0, 15.0, 14.0, 27.0, 41.0, 76.0, 171.0, 213.0, 164.0, 80.0, 43.0, 28.0, 13.0, 11.0, 12.0, 10.0, 5.0, 6.0, 1.0, 10.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0226287841796875, -0.021587610244750977, -0.020546436309814453, -0.01950526237487793, -0.018464088439941406, -0.017422914505004883, -0.01638174057006836, -0.015340566635131836, -0.014299392700195312, -0.013258218765258789, -0.012217044830322266, -0.011175870895385742, -0.010134696960449219, -0.009093523025512695, -0.008052349090576172, -0.0070111751556396484, -0.005970001220703125, -0.0049288272857666016, -0.003887653350830078, -0.0028464794158935547, -0.0018053054809570312, -0.0007641315460205078, 0.0002770423889160156, 0.001318216323852539, 0.0023593902587890625, 0.003400564193725586, 0.004441738128662109, 0.005482912063598633, 0.006524085998535156, 0.00756525993347168, 0.008606433868408203, 0.009647607803344727, 0.01068878173828125, 0.011729955673217773, 0.012771129608154297, 0.01381230354309082, 0.014853477478027344, 0.015894651412963867, 0.01693582534790039, 0.017976999282836914, 0.019018173217773438, 0.02005934715270996, 0.021100521087646484, 0.022141695022583008, 0.02318286895751953, 0.024224042892456055, 0.025265216827392578, 0.0263063907623291, 0.027347564697265625, 0.02838873863220215, 0.029429912567138672, 0.030471086502075195, 0.03151226043701172, 0.03255343437194824, 0.033594608306884766, 0.03463578224182129, 0.03567695617675781, 0.036718130111694336, 0.03775930404663086, 0.03880047798156738, 0.039841651916503906, 0.04088282585144043, 0.04192399978637695, 0.04296517372131348, 0.04400634765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 27.0, 29.0, 46.0, 73.0, 118.0, 277.0, 476.0, 1112.0, 3023.0, 10420.0, 57537.0, 477385.0, 430440.0, 52129.0, 10093.0, 3055.0, 1184.0, 526.0, 224.0, 162.0, 77.0, 42.0, 29.0, 19.0, 13.0, 4.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1614990234375, -0.15628433227539062, -0.15106964111328125, -0.14585494995117188, -0.1406402587890625, -0.13542556762695312, -0.13021087646484375, -0.12499618530273438, -0.119781494140625, -0.11456680297851562, -0.10935211181640625, -0.10413742065429688, -0.0989227294921875, -0.09370803833007812, -0.08849334716796875, -0.08327865600585938, -0.07806396484375, -0.07284927368164062, -0.06763458251953125, -0.062419891357421875, -0.0572052001953125, -0.051990509033203125, -0.04677581787109375, -0.041561126708984375, -0.036346435546875, -0.031131744384765625, -0.02591705322265625, -0.020702362060546875, -0.0154876708984375, -0.010272979736328125, -0.00505828857421875, 0.000156402587890625, 0.00537109375, 0.010585784912109375, 0.01580047607421875, 0.021015167236328125, 0.0262298583984375, 0.031444549560546875, 0.03665924072265625, 0.041873931884765625, 0.047088623046875, 0.052303314208984375, 0.05751800537109375, 0.06273269653320312, 0.0679473876953125, 0.07316207885742188, 0.07837677001953125, 0.08359146118164062, 0.08880615234375, 0.09402084350585938, 0.09923553466796875, 0.10445022583007812, 0.1096649169921875, 0.11487960815429688, 0.12009429931640625, 0.12530899047851562, 0.130523681640625, 0.13573837280273438, 0.14095306396484375, 0.14616775512695312, 0.1513824462890625, 0.15659713745117188, 0.16181182861328125, 0.16702651977539062, 0.1722412109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 8.0, 16.0, 7.0, 19.0, 16.0, 23.0, 29.0, 26.0, 32.0, 37.0, 43.0, 31.0, 46.0, 39.0, 49.0, 47.0, 55.0, 44.0, 43.0, 38.0, 41.0, 36.0, 34.0, 38.0, 36.0, 16.0, 26.0, 19.0, 20.0, 15.0, 16.0, 9.0, 9.0, 5.0, 2.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.09246826171875, -0.08959674835205078, -0.08672523498535156, -0.08385372161865234, -0.08098220825195312, -0.0781106948852539, -0.07523918151855469, -0.07236766815185547, -0.06949615478515625, -0.06662464141845703, -0.06375312805175781, -0.060881614685058594, -0.058010101318359375, -0.055138587951660156, -0.05226707458496094, -0.04939556121826172, -0.0465240478515625, -0.04365253448486328, -0.04078102111816406, -0.037909507751464844, -0.035037994384765625, -0.032166481018066406, -0.029294967651367188, -0.02642345428466797, -0.02355194091796875, -0.02068042755126953, -0.017808914184570312, -0.014937400817871094, -0.012065887451171875, -0.009194374084472656, -0.0063228607177734375, -0.0034513473510742188, -0.000579833984375, 0.0022916793823242188, 0.0051631927490234375, 0.008034706115722656, 0.010906219482421875, 0.013777732849121094, 0.016649246215820312, 0.01952075958251953, 0.02239227294921875, 0.02526378631591797, 0.028135299682617188, 0.031006813049316406, 0.033878326416015625, 0.036749839782714844, 0.03962135314941406, 0.04249286651611328, 0.0453643798828125, 0.04823589324951172, 0.05110740661621094, 0.053978919982910156, 0.056850433349609375, 0.059721946716308594, 0.06259346008300781, 0.06546497344970703, 0.06833648681640625, 0.07120800018310547, 0.07407951354980469, 0.0769510269165039, 0.07982254028320312, 0.08269405364990234, 0.08556556701660156, 0.08843708038330078, 0.09130859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 22.0, 21.0, 51.0, 92.0, 173.0, 349.0, 775.0, 1945.0, 6418.0, 31088.0, 296824.0, 622466.0, 71496.0, 11666.0, 3044.0, 1146.0, 451.0, 219.0, 110.0, 67.0, 40.0, 23.0, 12.0, 11.0, 9.0, 1.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.204345703125, -0.19854164123535156, -0.19273757934570312, -0.1869335174560547, -0.18112945556640625, -0.1753253936767578, -0.16952133178710938, -0.16371726989746094, -0.1579132080078125, -0.15210914611816406, -0.14630508422851562, -0.1405010223388672, -0.13469696044921875, -0.1288928985595703, -0.12308883666992188, -0.11728477478027344, -0.111480712890625, -0.10567665100097656, -0.09987258911132812, -0.09406852722167969, -0.08826446533203125, -0.08246040344238281, -0.07665634155273438, -0.07085227966308594, -0.0650482177734375, -0.05924415588378906, -0.053440093994140625, -0.04763603210449219, -0.04183197021484375, -0.03602790832519531, -0.030223846435546875, -0.024419784545898438, -0.01861572265625, -0.012811660766601562, -0.007007598876953125, -0.0012035369873046875, 0.00460052490234375, 0.010404586791992188, 0.016208648681640625, 0.022012710571289062, 0.0278167724609375, 0.03362083435058594, 0.039424896240234375, 0.04522895812988281, 0.05103302001953125, 0.05683708190917969, 0.06264114379882812, 0.06844520568847656, 0.074249267578125, 0.08005332946777344, 0.08585739135742188, 0.09166145324707031, 0.09746551513671875, 0.10326957702636719, 0.10907363891601562, 0.11487770080566406, 0.1206817626953125, 0.12648582458496094, 0.13228988647460938, 0.1380939483642578, 0.14389801025390625, 0.1497020721435547, 0.15550613403320312, 0.16131019592285156, 0.1671142578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 7.0, 17.0, 10.0, 11.0, 26.0, 39.0, 51.0, 61.0, 91.0, 106.0, 113.0, 110.0, 91.0, 70.0, 49.0, 36.0, 31.0, 21.0, 26.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.196996688842773e-05, -8.819904178380966e-05, -8.442811667919159e-05, -8.065719157457352e-05, -7.688626646995544e-05, -7.311534136533737e-05, -6.93444162607193e-05, -6.557349115610123e-05, -6.180256605148315e-05, -5.803164094686508e-05, -5.426071584224701e-05, -5.048979073762894e-05, -4.6718865633010864e-05, -4.294794052839279e-05, -3.917701542377472e-05, -3.540609031915665e-05, -3.1635165214538574e-05, -2.7864240109920502e-05, -2.409331500530243e-05, -2.0322389900684357e-05, -1.6551464796066284e-05, -1.2780539691448212e-05, -9.00961458683014e-06, -5.238689482212067e-06, -1.4677643775939941e-06, 2.3031607270240784e-06, 6.074085831642151e-06, 9.845010936260223e-06, 1.3615936040878296e-05, 1.738686114549637e-05, 2.115778625011444e-05, 2.4928711354732513e-05, 2.8699636459350586e-05, 3.247056156396866e-05, 3.624148666858673e-05, 4.0012411773204803e-05, 4.3783336877822876e-05, 4.755426198244095e-05, 5.132518708705902e-05, 5.5096112191677094e-05, 5.8867037296295166e-05, 6.263796240091324e-05, 6.640888750553131e-05, 7.017981261014938e-05, 7.395073771476746e-05, 7.772166281938553e-05, 8.14925879240036e-05, 8.526351302862167e-05, 8.903443813323975e-05, 9.280536323785782e-05, 9.657628834247589e-05, 0.00010034721344709396, 0.00010411813855171204, 0.00010788906365633011, 0.00011165998876094818, 0.00011543091386556625, 0.00011920183897018433, 0.0001229727640748024, 0.00012674368917942047, 0.00013051461428403854, 0.00013428553938865662, 0.0001380564644932747, 0.00014182738959789276, 0.00014559831470251083, 0.0001493692398071289]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 17.0, 12.0, 18.0, 30.0, 45.0, 65.0, 108.0, 169.0, 301.0, 561.0, 1001.0, 2202.0, 5517.0, 16139.0, 61198.0, 268637.0, 475423.0, 160209.0, 37659.0, 11178.0, 4094.0, 1802.0, 960.0, 470.0, 274.0, 169.0, 89.0, 72.0, 39.0, 32.0, 23.0, 15.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.0972137451171875, -0.093780517578125, -0.0903472900390625, -0.0869140625, -0.0834808349609375, -0.080047607421875, -0.0766143798828125, -0.07318115234375, -0.0697479248046875, -0.066314697265625, -0.0628814697265625, -0.0594482421875, -0.0560150146484375, -0.052581787109375, -0.0491485595703125, -0.04571533203125, -0.0422821044921875, -0.038848876953125, -0.0354156494140625, -0.031982421875, -0.0285491943359375, -0.025115966796875, -0.0216827392578125, -0.01824951171875, -0.0148162841796875, -0.011383056640625, -0.0079498291015625, -0.0045166015625, -0.0010833740234375, 0.002349853515625, 0.0057830810546875, 0.00921630859375, 0.0126495361328125, 0.016082763671875, 0.0195159912109375, 0.02294921875, 0.0263824462890625, 0.029815673828125, 0.0332489013671875, 0.03668212890625, 0.0401153564453125, 0.043548583984375, 0.0469818115234375, 0.0504150390625, 0.0538482666015625, 0.057281494140625, 0.0607147216796875, 0.06414794921875, 0.0675811767578125, 0.071014404296875, 0.0744476318359375, 0.077880859375, 0.0813140869140625, 0.084747314453125, 0.0881805419921875, 0.09161376953125, 0.0950469970703125, 0.098480224609375, 0.1019134521484375, 0.1053466796875, 0.1087799072265625, 0.112213134765625, 0.1156463623046875, 0.11907958984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 10.0, 6.0, 11.0, 18.0, 21.0, 36.0, 36.0, 38.0, 61.0, 69.0, 85.0, 106.0, 86.0, 67.0, 63.0, 59.0, 47.0, 45.0, 27.0, 25.0, 23.0, 11.0, 9.0, 8.0, 10.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0635986328125, -0.06102466583251953, -0.05845069885253906, -0.055876731872558594, -0.053302764892578125, -0.050728797912597656, -0.04815483093261719, -0.04558086395263672, -0.04300689697265625, -0.04043292999267578, -0.03785896301269531, -0.035284996032714844, -0.032711029052734375, -0.030137062072753906, -0.027563095092773438, -0.02498912811279297, -0.0224151611328125, -0.01984119415283203, -0.017267227172851562, -0.014693260192871094, -0.012119293212890625, -0.009545326232910156, -0.0069713592529296875, -0.004397392272949219, -0.00182342529296875, 0.0007505416870117188, 0.0033245086669921875, 0.005898475646972656, 0.008472442626953125, 0.011046409606933594, 0.013620376586914062, 0.01619434356689453, 0.018768310546875, 0.02134227752685547, 0.023916244506835938, 0.026490211486816406, 0.029064178466796875, 0.031638145446777344, 0.03421211242675781, 0.03678607940673828, 0.03936004638671875, 0.04193401336669922, 0.04450798034667969, 0.047081947326660156, 0.049655914306640625, 0.052229881286621094, 0.05480384826660156, 0.05737781524658203, 0.0599517822265625, 0.06252574920654297, 0.06509971618652344, 0.0676736831665039, 0.07024765014648438, 0.07282161712646484, 0.07539558410644531, 0.07796955108642578, 0.08054351806640625, 0.08311748504638672, 0.08569145202636719, 0.08826541900634766, 0.09083938598632812, 0.0934133529663086, 0.09598731994628906, 0.09856128692626953, 0.10113525390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 21.0, 121.0, 438.0, 353.0, 48.0, 14.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1782442331314087, -1.1036667823791504, -1.029089331626892, -0.9545119404792786, -0.8799344897270203, -0.805357038974762, -0.7307796478271484, -0.6562021970748901, -0.5816247463226318, -0.5070472955703735, -0.4324698746204376, -0.3578924536705017, -0.2833150029182434, -0.2087375521659851, -0.1341601312160492, -0.05958271026611328, 0.01499474048614502, 0.08957217633724213, 0.16414961218833923, 0.23872704803943634, 0.31330448389053345, 0.38788193464279175, 0.46245935559272766, 0.5370367765426636, 0.6116142272949219, 0.6861916780471802, 0.7607691287994385, 0.835346519947052, 0.9099239706993103, 0.9845014214515686, 1.0590788125991821, 1.1336562633514404, 1.2082338333129883, 1.2828112840652466, 1.3573887348175049, 1.4319661855697632, 1.5065436363220215, 1.5811209678649902, 1.6556984186172485, 1.7302758693695068, 1.8048533201217651, 1.8794307708740234, 1.9540082216262817, 2.02858567237854, 2.103163003921509, 2.1777405738830566, 2.2523179054260254, 2.326895236968994, 2.401472806930542, 2.4760501384735107, 2.5506277084350586, 2.6252050399780273, 2.699782609939575, 2.774359941482544, 2.848937511444092, 2.9235148429870605, 2.9980921745300293, 3.072669506072998, 3.147247076034546, 3.2218244075775146, 3.2964019775390625, 3.3709793090820312, 3.445556879043579, 3.520134210586548, 3.5947117805480957]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 2.0, 10.0, 10.0, 31.0, 23.0, 36.0, 57.0, 73.0, 87.0, 103.0, 88.0, 94.0, 85.0, 57.0, 56.0, 47.0, 40.0, 25.0, 19.0, 9.0, 14.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0531800985336304, -1.0190048217773438, -0.9848296642303467, -0.9506543874740601, -0.9164791703224182, -0.8823039531707764, -0.8481286764144897, -0.8139534592628479, -0.779778242111206, -0.7456030249595642, -0.7114278078079224, -0.6772525310516357, -0.6430773138999939, -0.608902096748352, -0.5747268199920654, -0.5405516028404236, -0.5063763856887817, -0.4722011685371399, -0.43802592158317566, -0.4038506746292114, -0.3696754574775696, -0.33550024032592773, -0.3013249933719635, -0.26714974641799927, -0.23297452926635742, -0.19879929721355438, -0.16462406516075134, -0.1304488331079483, -0.09627360105514526, -0.062098369002342224, -0.027923136949539185, 0.006252095103263855, 0.040427446365356445, 0.07460267841815948, 0.10877791047096252, 0.14295314252376556, 0.1771283745765686, 0.21130360662937164, 0.24547883868217468, 0.2796540856361389, 0.31382930278778076, 0.3480045199394226, 0.38217976689338684, 0.4163550138473511, 0.4505302309989929, 0.48470544815063477, 0.5188807249069214, 0.5530559420585632, 0.5872311592102051, 0.6214063763618469, 0.6555815935134888, 0.6897568702697754, 0.7239320874214172, 0.7581073045730591, 0.7922825813293457, 0.8264577984809875, 0.8606330156326294, 0.8948082327842712, 0.9289834499359131, 0.9631587266921997, 0.9973339438438416, 1.0315091609954834, 1.06568443775177, 1.099859595298767, 1.1340348720550537]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 15.0, 22.0, 41.0, 52.0, 73.0, 124.0, 136.0, 233.0, 359.0, 625.0, 1073.0, 1709.0, 3017.0, 6392.0, 18105.0, 80523.0, 3631899.0, 386089.0, 38859.0, 12218.0, 5221.0, 2633.0, 1518.0, 998.0, 664.0, 487.0, 299.0, 245.0, 165.0, 118.0, 101.0, 62.0, 38.0, 30.0, 24.0, 20.0, 17.0, 11.0, 9.0, 13.0, 6.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.276123046875, -0.26451873779296875, -0.2529144287109375, -0.24131011962890625, -0.229705810546875, -0.21810150146484375, -0.2064971923828125, -0.19489288330078125, -0.18328857421875, -0.17168426513671875, -0.1600799560546875, -0.14847564697265625, -0.136871337890625, -0.12526702880859375, -0.1136627197265625, -0.10205841064453125, -0.0904541015625, -0.07884979248046875, -0.0672454833984375, -0.05564117431640625, -0.044036865234375, -0.03243255615234375, -0.0208282470703125, -0.00922393798828125, 0.00238037109375, 0.01398468017578125, 0.0255889892578125, 0.03719329833984375, 0.048797607421875, 0.06040191650390625, 0.0720062255859375, 0.08361053466796875, 0.09521484375, 0.10681915283203125, 0.1184234619140625, 0.13002777099609375, 0.141632080078125, 0.15323638916015625, 0.1648406982421875, 0.17644500732421875, 0.18804931640625, 0.19965362548828125, 0.2112579345703125, 0.22286224365234375, 0.234466552734375, 0.24607086181640625, 0.2576751708984375, 0.26927947998046875, 0.2808837890625, 0.29248809814453125, 0.3040924072265625, 0.31569671630859375, 0.327301025390625, 0.33890533447265625, 0.3505096435546875, 0.36211395263671875, 0.37371826171875, 0.38532257080078125, 0.3969268798828125, 0.40853118896484375, 0.420135498046875, 0.43173980712890625, 0.4433441162109375, 0.45494842529296875, 0.466552734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 7.0, 1.0, 2.0, 4.0, 4.0, 10.0, 10.0, 14.0, 15.0, 19.0, 34.0, 70.0, 117.0, 192.0, 191.0, 128.0, 57.0, 34.0, 22.0, 17.0, 11.0, 10.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027313232421875, -0.026135921478271484, -0.02495861053466797, -0.023781299591064453, -0.022603988647460938, -0.021426677703857422, -0.020249366760253906, -0.01907205581665039, -0.017894744873046875, -0.01671743392944336, -0.015540122985839844, -0.014362812042236328, -0.013185501098632812, -0.012008190155029297, -0.010830879211425781, -0.009653568267822266, -0.00847625732421875, -0.007298946380615234, -0.006121635437011719, -0.004944324493408203, -0.0037670135498046875, -0.002589702606201172, -0.0014123916625976562, -0.00023508071899414062, 0.000942230224609375, 0.0021195411682128906, 0.0032968521118164062, 0.004474163055419922, 0.0056514739990234375, 0.006828784942626953, 0.008006095886230469, 0.009183406829833984, 0.0103607177734375, 0.011538028717041016, 0.012715339660644531, 0.013892650604248047, 0.015069961547851562, 0.016247272491455078, 0.017424583435058594, 0.01860189437866211, 0.019779205322265625, 0.02095651626586914, 0.022133827209472656, 0.023311138153076172, 0.024488449096679688, 0.025665760040283203, 0.02684307098388672, 0.028020381927490234, 0.02919769287109375, 0.030375003814697266, 0.03155231475830078, 0.0327296257019043, 0.03390693664550781, 0.03508424758911133, 0.036261558532714844, 0.03743886947631836, 0.038616180419921875, 0.03979349136352539, 0.040970802307128906, 0.04214811325073242, 0.04332542419433594, 0.04450273513793945, 0.04568004608154297, 0.046857357025146484, 0.04803466796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 12.0, 10.0, 12.0, 16.0, 26.0, 44.0, 84.0, 132.0, 361.0, 1006.0, 4182.0, 28231.0, 987988.0, 3119339.0, 44944.0, 5734.0, 1332.0, 400.0, 171.0, 91.0, 45.0, 37.0, 24.0, 12.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4853515625, -0.4697418212890625, -0.454132080078125, -0.4385223388671875, -0.42291259765625, -0.4073028564453125, -0.391693115234375, -0.3760833740234375, -0.3604736328125, -0.3448638916015625, -0.329254150390625, -0.3136444091796875, -0.29803466796875, -0.2824249267578125, -0.266815185546875, -0.2512054443359375, -0.235595703125, -0.2199859619140625, -0.204376220703125, -0.1887664794921875, -0.17315673828125, -0.1575469970703125, -0.141937255859375, -0.1263275146484375, -0.1107177734375, -0.0951080322265625, -0.079498291015625, -0.0638885498046875, -0.04827880859375, -0.0326690673828125, -0.017059326171875, -0.0014495849609375, 0.01416015625, 0.0297698974609375, 0.045379638671875, 0.0609893798828125, 0.07659912109375, 0.0922088623046875, 0.107818603515625, 0.1234283447265625, 0.1390380859375, 0.1546478271484375, 0.170257568359375, 0.1858673095703125, 0.20147705078125, 0.2170867919921875, 0.232696533203125, 0.2483062744140625, 0.263916015625, 0.2795257568359375, 0.295135498046875, 0.3107452392578125, 0.32635498046875, 0.3419647216796875, 0.357574462890625, 0.3731842041015625, 0.3887939453125, 0.4044036865234375, 0.420013427734375, 0.4356231689453125, 0.45123291015625, 0.4668426513671875, 0.482452392578125, 0.4980621337890625, 0.513671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 3.0, 9.0, 11.0, 25.0, 48.0, 43.0, 74.0, 126.0, 227.0, 399.0, 1180.0, 999.0, 374.0, 201.0, 126.0, 65.0, 38.0, 29.0, 25.0, 15.0, 10.0, 9.0, 8.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05126953125, -0.04966545104980469, -0.048061370849609375, -0.04645729064941406, -0.04485321044921875, -0.04324913024902344, -0.041645050048828125, -0.04004096984863281, -0.0384368896484375, -0.03683280944824219, -0.035228729248046875, -0.03362464904785156, -0.03202056884765625, -0.030416488647460938, -0.028812408447265625, -0.027208328247070312, -0.025604248046875, -0.024000167846679688, -0.022396087646484375, -0.020792007446289062, -0.01918792724609375, -0.017583847045898438, -0.015979766845703125, -0.014375686645507812, -0.0127716064453125, -0.011167526245117188, -0.009563446044921875, -0.007959365844726562, -0.00635528564453125, -0.0047512054443359375, -0.003147125244140625, -0.0015430450439453125, 6.103515625e-05, 0.0016651153564453125, 0.003269195556640625, 0.0048732757568359375, 0.00647735595703125, 0.008081436157226562, 0.009685516357421875, 0.011289596557617188, 0.0128936767578125, 0.014497756958007812, 0.016101837158203125, 0.017705917358398438, 0.01930999755859375, 0.020914077758789062, 0.022518157958984375, 0.024122238159179688, 0.025726318359375, 0.027330398559570312, 0.028934478759765625, 0.030538558959960938, 0.03214263916015625, 0.03374671936035156, 0.035350799560546875, 0.03695487976074219, 0.0385589599609375, 0.04016304016113281, 0.041767120361328125, 0.04337120056152344, 0.04497528076171875, 0.04657936096191406, 0.048183441162109375, 0.04978752136230469, 0.0513916015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 21.0, 36.0, 49.0, 122.0, 194.0, 197.0, 162.0, 103.0, 52.0, 27.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23055657744407654, -0.2192464917898178, -0.20793640613555908, -0.19662630558013916, -0.18531623482704163, -0.1740061342716217, -0.16269604861736298, -0.15138596296310425, -0.14007587730884552, -0.1287657916545868, -0.11745570600032806, -0.10614561289548874, -0.09483552724123001, -0.08352544158697128, -0.07221534848213196, -0.06090526282787323, -0.0495951771736145, -0.038285091519355774, -0.026975002139806747, -0.01566491276025772, -0.004354827105998993, 0.006955258548259735, 0.01826535165309906, 0.029575437307357788, 0.040885522961616516, 0.052195608615875244, 0.06350569427013397, 0.0748157873749733, 0.08612587302923203, 0.09743595868349075, 0.10874605178833008, 0.1200561374425888, 0.13136622309684753, 0.14267630875110626, 0.153986394405365, 0.1652964949607849, 0.17660656571388245, 0.18791666626930237, 0.1992267519235611, 0.21053683757781982, 0.22184692323207855, 0.23315700888633728, 0.244467094540596, 0.25577718019485474, 0.26708728075027466, 0.2783973515033722, 0.2897074520587921, 0.30101752281188965, 0.31232762336730957, 0.3236377239227295, 0.334947794675827, 0.34625789523124695, 0.3575679659843445, 0.3688780665397644, 0.3801881670951843, 0.39149823784828186, 0.4028083086013794, 0.4141184091567993, 0.42542847990989685, 0.4367385804653168, 0.4480486512184143, 0.45935875177383423, 0.47066885232925415, 0.4819789230823517, 0.4932890236377716]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 5.0, 13.0, 8.0, 17.0, 16.0, 29.0, 33.0, 40.0, 42.0, 69.0, 69.0, 75.0, 44.0, 57.0, 92.0, 61.0, 60.0, 52.0, 47.0, 30.0, 40.0, 33.0, 15.0, 9.0, 16.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.190393328666687, -0.18349000811576843, -0.17658667266368866, -0.16968335211277008, -0.1627800166606903, -0.15587669610977173, -0.14897337555885315, -0.14207004010677338, -0.1351667046546936, -0.12826338410377502, -0.12136004865169525, -0.11445672810077667, -0.1075533926486969, -0.10065007209777832, -0.09374674409627914, -0.08684341609477997, -0.07994009554386139, -0.07303676754236221, -0.06613343954086304, -0.05923011526465416, -0.052326787263154984, -0.04542345926165581, -0.03852013498544693, -0.031616806983947754, -0.024713478982448578, -0.017810150980949402, -0.010906824842095375, -0.004003498703241348, 0.0028998292982578278, 0.009803157299757004, 0.01670648157596588, 0.023609809577465057, 0.030513137578964233, 0.03741646558046341, 0.044319793581962585, 0.05122311785817146, 0.05812644585967064, 0.06502977013587952, 0.07193309813737869, 0.07883642613887787, 0.08573975414037704, 0.09264308214187622, 0.0995464101433754, 0.10644973814487457, 0.11335305869579315, 0.12025639414787292, 0.1271597146987915, 0.13406303524971008, 0.14096637070178986, 0.14786969125270844, 0.1547730267047882, 0.1616763472557068, 0.16857968270778656, 0.17548300325870514, 0.1823863387107849, 0.1892896592617035, 0.19619297981262207, 0.20309630036354065, 0.20999963581562042, 0.216902956366539, 0.22380629181861877, 0.23070961236953735, 0.23761293292045593, 0.2445162683725357, 0.2514196038246155]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 4.0, 11.0, 14.0, 32.0, 48.0, 56.0, 98.0, 150.0, 253.0, 402.0, 644.0, 1341.0, 2765.0, 6072.0, 17860.0, 80985.0, 634008.0, 250102.0, 34985.0, 10445.0, 4107.0, 1921.0, 935.0, 514.0, 302.0, 182.0, 112.0, 69.0, 55.0, 27.0, 11.0, 14.0, 11.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.3006629943847656, -0.29175567626953125, -0.2828483581542969, -0.2739410400390625, -0.2650337219238281, -0.25612640380859375, -0.24721908569335938, -0.238311767578125, -0.22940444946289062, -0.22049713134765625, -0.21158981323242188, -0.2026824951171875, -0.19377517700195312, -0.18486785888671875, -0.17596054077148438, -0.16705322265625, -0.15814590454101562, -0.14923858642578125, -0.14033126831054688, -0.1314239501953125, -0.12251663208007812, -0.11360931396484375, -0.10470199584960938, -0.095794677734375, -0.08688735961914062, -0.07798004150390625, -0.06907272338867188, -0.0601654052734375, -0.051258087158203125, -0.04235076904296875, -0.033443450927734375, -0.0245361328125, -0.015628814697265625, -0.00672149658203125, 0.002185821533203125, 0.0110931396484375, 0.020000457763671875, 0.02890777587890625, 0.037815093994140625, 0.046722412109375, 0.055629730224609375, 0.06453704833984375, 0.07344436645507812, 0.0823516845703125, 0.09125900268554688, 0.10016632080078125, 0.10907363891601562, 0.11798095703125, 0.12688827514648438, 0.13579559326171875, 0.14470291137695312, 0.1536102294921875, 0.16251754760742188, 0.17142486572265625, 0.18033218383789062, 0.189239501953125, 0.19814682006835938, 0.20705413818359375, 0.21596145629882812, 0.2248687744140625, 0.23377609252929688, 0.24268341064453125, 0.2515907287597656, 0.260498046875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 2.0, 10.0, 7.0, 13.0, 25.0, 35.0, 67.0, 122.0, 139.0, 187.0, 136.0, 89.0, 54.0, 36.0, 15.0, 16.0, 9.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026641845703125, -0.025508880615234375, -0.02437591552734375, -0.023242950439453125, -0.0221099853515625, -0.020977020263671875, -0.01984405517578125, -0.018711090087890625, -0.017578125, -0.016445159912109375, -0.01531219482421875, -0.014179229736328125, -0.0130462646484375, -0.011913299560546875, -0.01078033447265625, -0.009647369384765625, -0.008514404296875, -0.007381439208984375, -0.00624847412109375, -0.005115509033203125, -0.0039825439453125, -0.002849578857421875, -0.00171661376953125, -0.000583648681640625, 0.00054931640625, 0.001682281494140625, 0.00281524658203125, 0.003948211669921875, 0.0050811767578125, 0.006214141845703125, 0.00734710693359375, 0.008480072021484375, 0.009613037109375, 0.010746002197265625, 0.01187896728515625, 0.013011932373046875, 0.0141448974609375, 0.015277862548828125, 0.01641082763671875, 0.017543792724609375, 0.0186767578125, 0.019809722900390625, 0.02094268798828125, 0.022075653076171875, 0.0232086181640625, 0.024341583251953125, 0.02547454833984375, 0.026607513427734375, 0.027740478515625, 0.028873443603515625, 0.03000640869140625, 0.031139373779296875, 0.0322723388671875, 0.033405303955078125, 0.03453826904296875, 0.035671234130859375, 0.03680419921875, 0.037937164306640625, 0.03907012939453125, 0.040203094482421875, 0.0413360595703125, 0.042469024658203125, 0.04360198974609375, 0.044734954833984375, 0.045867919921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 12.0, 16.0, 22.0, 23.0, 45.0, 56.0, 91.0, 110.0, 136.0, 235.0, 351.0, 608.0, 946.0, 2047.0, 5641.0, 20901.0, 99329.0, 428665.0, 379223.0, 82662.0, 17996.0, 5079.0, 1775.0, 920.0, 533.0, 331.0, 220.0, 149.0, 106.0, 66.0, 56.0, 38.0, 27.0, 34.0, 8.0, 20.0, 11.0, 8.0, 7.0, 4.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.2344970703125, -0.22758865356445312, -0.22068023681640625, -0.21377182006835938, -0.2068634033203125, -0.19995498657226562, -0.19304656982421875, -0.18613815307617188, -0.179229736328125, -0.17232131958007812, -0.16541290283203125, -0.15850448608398438, -0.1515960693359375, -0.14468765258789062, -0.13777923583984375, -0.13087081909179688, -0.12396240234375, -0.11705398559570312, -0.11014556884765625, -0.10323715209960938, -0.0963287353515625, -0.08942031860351562, -0.08251190185546875, -0.07560348510742188, -0.068695068359375, -0.061786651611328125, -0.05487823486328125, -0.047969818115234375, -0.0410614013671875, -0.034152984619140625, -0.02724456787109375, -0.020336151123046875, -0.013427734375, -0.006519317626953125, 0.00038909912109375, 0.007297515869140625, 0.0142059326171875, 0.021114349365234375, 0.02802276611328125, 0.034931182861328125, 0.041839599609375, 0.048748016357421875, 0.05565643310546875, 0.06256484985351562, 0.0694732666015625, 0.07638168334960938, 0.08329010009765625, 0.09019851684570312, 0.09710693359375, 0.10401535034179688, 0.11092376708984375, 0.11783218383789062, 0.1247406005859375, 0.13164901733398438, 0.13855743408203125, 0.14546585083007812, 0.152374267578125, 0.15928268432617188, 0.16619110107421875, 0.17309951782226562, 0.1800079345703125, 0.18691635131835938, 0.19382476806640625, 0.20073318481445312, 0.2076416015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 8.0, 14.0, 20.0, 12.0, 22.0, 33.0, 26.0, 31.0, 32.0, 44.0, 38.0, 32.0, 48.0, 42.0, 50.0, 53.0, 36.0, 37.0, 45.0, 41.0, 43.0, 39.0, 29.0, 24.0, 28.0, 22.0, 21.0, 18.0, 18.0, 14.0, 15.0, 6.0, 9.0, 6.0, 6.0, 0.0, 4.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.104736328125, -0.1015481948852539, -0.09836006164550781, -0.09517192840576172, -0.09198379516601562, -0.08879566192626953, -0.08560752868652344, -0.08241939544677734, -0.07923126220703125, -0.07604312896728516, -0.07285499572753906, -0.06966686248779297, -0.06647872924804688, -0.06329059600830078, -0.06010246276855469, -0.056914329528808594, -0.0537261962890625, -0.050538063049316406, -0.04734992980957031, -0.04416179656982422, -0.040973663330078125, -0.03778553009033203, -0.03459739685058594, -0.031409263610839844, -0.02822113037109375, -0.025032997131347656, -0.021844863891601562, -0.01865673065185547, -0.015468597412109375, -0.012280464172363281, -0.009092330932617188, -0.005904197692871094, -0.002716064453125, 0.00047206878662109375, 0.0036602020263671875, 0.006848335266113281, 0.010036468505859375, 0.013224601745605469, 0.016412734985351562, 0.019600868225097656, 0.02278900146484375, 0.025977134704589844, 0.029165267944335938, 0.03235340118408203, 0.035541534423828125, 0.03872966766357422, 0.04191780090332031, 0.045105934143066406, 0.0482940673828125, 0.051482200622558594, 0.05467033386230469, 0.05785846710205078, 0.061046600341796875, 0.06423473358154297, 0.06742286682128906, 0.07061100006103516, 0.07379913330078125, 0.07698726654052734, 0.08017539978027344, 0.08336353302001953, 0.08655166625976562, 0.08973979949951172, 0.09292793273925781, 0.0961160659790039, 0.09930419921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 11.0, 14.0, 19.0, 39.0, 49.0, 98.0, 147.0, 283.0, 577.0, 1304.0, 3469.0, 10326.0, 35400.0, 138259.0, 448897.0, 302546.0, 76231.0, 20347.0, 6317.0, 2298.0, 936.0, 411.0, 244.0, 128.0, 77.0, 29.0, 27.0, 17.0, 13.0, 11.0, 9.0, 9.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.12873458862304688, -0.12441253662109375, -0.12009048461914062, -0.1157684326171875, -0.11144638061523438, -0.10712432861328125, -0.10280227661132812, -0.098480224609375, -0.09415817260742188, -0.08983612060546875, -0.08551406860351562, -0.0811920166015625, -0.07686996459960938, -0.07254791259765625, -0.06822586059570312, -0.06390380859375, -0.059581756591796875, -0.05525970458984375, -0.050937652587890625, -0.0466156005859375, -0.042293548583984375, -0.03797149658203125, -0.033649444580078125, -0.029327392578125, -0.025005340576171875, -0.02068328857421875, -0.016361236572265625, -0.0120391845703125, -0.007717132568359375, -0.00339508056640625, 0.000926971435546875, 0.0052490234375, 0.009571075439453125, 0.01389312744140625, 0.018215179443359375, 0.0225372314453125, 0.026859283447265625, 0.03118133544921875, 0.035503387451171875, 0.039825439453125, 0.044147491455078125, 0.04846954345703125, 0.052791595458984375, 0.0571136474609375, 0.061435699462890625, 0.06575775146484375, 0.07007980346679688, 0.07440185546875, 0.07872390747070312, 0.08304595947265625, 0.08736801147460938, 0.0916900634765625, 0.09601211547851562, 0.10033416748046875, 0.10465621948242188, 0.108978271484375, 0.11330032348632812, 0.11762237548828125, 0.12194442749023438, 0.1262664794921875, 0.13058853149414062, 0.13491058349609375, 0.13923263549804688, 0.1435546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 12.0, 4.0, 7.0, 13.0, 12.0, 26.0, 32.0, 53.0, 58.0, 76.0, 97.0, 102.0, 126.0, 101.0, 81.0, 78.0, 40.0, 26.0, 18.0, 16.0, 10.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001957416534423828, -0.0001909509301185608, -0.00018616020679473877, -0.00018136948347091675, -0.00017657876014709473, -0.0001717880368232727, -0.00016699731349945068, -0.00016220659017562866, -0.00015741586685180664, -0.00015262514352798462, -0.0001478344202041626, -0.00014304369688034058, -0.00013825297355651855, -0.00013346225023269653, -0.0001286715269088745, -0.0001238808035850525, -0.00011909008026123047, -0.00011429935693740845, -0.00010950863361358643, -0.0001047179102897644, -9.992718696594238e-05, -9.513646364212036e-05, -9.034574031829834e-05, -8.555501699447632e-05, -8.07642936706543e-05, -7.597357034683228e-05, -7.118284702301025e-05, -6.639212369918823e-05, -6.160140037536621e-05, -5.681067705154419e-05, -5.201995372772217e-05, -4.7229230403900146e-05, -4.2438507080078125e-05, -3.7647783756256104e-05, -3.285706043243408e-05, -2.806633710861206e-05, -2.327561378479004e-05, -1.8484890460968018e-05, -1.3694167137145996e-05, -8.903443813323975e-06, -4.112720489501953e-06, 6.780028343200684e-07, 5.46872615814209e-06, 1.0259449481964111e-05, 1.5050172805786133e-05, 1.9840896129608154e-05, 2.4631619453430176e-05, 2.9422342777252197e-05, 3.421306610107422e-05, 3.900378942489624e-05, 4.379451274871826e-05, 4.858523607254028e-05, 5.3375959396362305e-05, 5.8166682720184326e-05, 6.295740604400635e-05, 6.774812936782837e-05, 7.253885269165039e-05, 7.732957601547241e-05, 8.212029933929443e-05, 8.691102266311646e-05, 9.170174598693848e-05, 9.64924693107605e-05, 0.00010128319263458252, 0.00010607391595840454, 0.00011086463928222656]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 12.0, 9.0, 18.0, 38.0, 45.0, 95.0, 176.0, 330.0, 785.0, 1996.0, 8084.0, 64900.0, 684823.0, 259438.0, 21568.0, 3944.0, 1227.0, 512.0, 220.0, 135.0, 79.0, 39.0, 25.0, 15.0, 10.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.1929302215576172, -0.18481063842773438, -0.17669105529785156, -0.16857147216796875, -0.16045188903808594, -0.15233230590820312, -0.1442127227783203, -0.1360931396484375, -0.1279735565185547, -0.11985397338867188, -0.11173439025878906, -0.10361480712890625, -0.09549522399902344, -0.08737564086914062, -0.07925605773925781, -0.071136474609375, -0.06301689147949219, -0.054897308349609375, -0.04677772521972656, -0.03865814208984375, -0.030538558959960938, -0.022418975830078125, -0.014299392700195312, -0.0061798095703125, 0.0019397735595703125, 0.010059356689453125, 0.018178939819335938, 0.02629852294921875, 0.03441810607910156, 0.042537689208984375, 0.05065727233886719, 0.05877685546875, 0.06689643859863281, 0.07501602172851562, 0.08313560485839844, 0.09125518798828125, 0.09937477111816406, 0.10749435424804688, 0.11561393737792969, 0.1237335205078125, 0.1318531036376953, 0.13997268676757812, 0.14809226989746094, 0.15621185302734375, 0.16433143615722656, 0.17245101928710938, 0.1805706024169922, 0.188690185546875, 0.1968097686767578, 0.20492935180664062, 0.21304893493652344, 0.22116851806640625, 0.22928810119628906, 0.23740768432617188, 0.2455272674560547, 0.2536468505859375, 0.2617664337158203, 0.2698860168457031, 0.27800559997558594, 0.28612518310546875, 0.29424476623535156, 0.3023643493652344, 0.3104839324951172, 0.318603515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 1.0, 5.0, 7.0, 10.0, 25.0, 29.0, 43.0, 40.0, 80.0, 109.0, 119.0, 112.0, 121.0, 86.0, 60.0, 42.0, 29.0, 24.0, 17.0, 8.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.0897531509399414, -0.08606147766113281, -0.08236980438232422, -0.07867813110351562, -0.07498645782470703, -0.07129478454589844, -0.06760311126708984, -0.06391143798828125, -0.060219764709472656, -0.05652809143066406, -0.05283641815185547, -0.049144744873046875, -0.04545307159423828, -0.04176139831542969, -0.038069725036621094, -0.0343780517578125, -0.030686378479003906, -0.026994705200195312, -0.02330303192138672, -0.019611358642578125, -0.01591968536376953, -0.012228012084960938, -0.008536338806152344, -0.00484466552734375, -0.0011529922485351562, 0.0025386810302734375, 0.006230354309082031, 0.009922027587890625, 0.013613700866699219, 0.017305374145507812, 0.020997047424316406, 0.024688720703125, 0.028380393981933594, 0.03207206726074219, 0.03576374053955078, 0.039455413818359375, 0.04314708709716797, 0.04683876037597656, 0.050530433654785156, 0.05422210693359375, 0.057913780212402344, 0.06160545349121094, 0.06529712677001953, 0.06898880004882812, 0.07268047332763672, 0.07637214660644531, 0.0800638198852539, 0.0837554931640625, 0.0874471664428711, 0.09113883972167969, 0.09483051300048828, 0.09852218627929688, 0.10221385955810547, 0.10590553283691406, 0.10959720611572266, 0.11328887939453125, 0.11698055267333984, 0.12067222595214844, 0.12436389923095703, 0.12805557250976562, 0.13174724578857422, 0.1354389190673828, 0.1391305923461914, 0.142822265625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 7.0, 20.0, 166.0, 540.0, 237.0, 37.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0903329849243164, -0.9469664096832275, -0.8035998344421387, -0.6602333188056946, -0.5168667435646057, -0.37350016832351685, -0.23013365268707275, -0.08676707744598389, 0.05659949779510498, 0.19996605813503265, 0.3433326184749603, 0.4866991639137268, 0.6300657391548157, 0.7734323143959045, 0.9167988300323486, 1.0601654052734375, 1.2035319805145264, 1.3468985557556152, 1.490265130996704, 1.633631706237793, 1.7769982814788818, 1.9203648567199707, 2.0637311935424805, 2.2070980072021484, 2.350464344024658, 2.493830919265747, 2.637197494506836, 2.780564069747925, 2.9239306449890137, 3.0672972202301025, 3.2106637954711914, 3.354030132293701, 3.497396945953369, 3.640763521194458, 3.784130096435547, 3.9274966716766357, 4.070863246917725, 4.214229583740234, 4.357596397399902, 4.500962734222412, 4.64432954788208, 4.78769588470459, 4.931062698364258, 5.074429035186768, 5.2177958488464355, 5.361162185668945, 5.504528999328613, 5.647895336151123, 5.791261672973633, 5.934628009796143, 6.0779948234558105, 6.22136116027832, 6.364727973937988, 6.508094310760498, 6.651461124420166, 6.794827461242676, 6.938194274902344, 7.0815606117248535, 7.2249274253845215, 7.368293762207031, 7.511660575866699, 7.655026912689209, 7.798393726348877, 7.941760063171387, 8.085126876831055]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 13.0, 16.0, 17.0, 13.0, 23.0, 21.0, 30.0, 31.0, 31.0, 40.0, 49.0, 44.0, 46.0, 46.0, 58.0, 50.0, 53.0, 45.0, 49.0, 33.0, 28.0, 42.0, 29.0, 29.0, 25.0, 24.0, 22.0, 14.0, 19.0, 8.0, 6.0, 11.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8151053190231323, -0.7894560694694519, -0.7638068199157715, -0.7381575107574463, -0.7125082612037659, -0.6868590116500854, -0.6612097024917603, -0.6355604529380798, -0.6099112033843994, -0.584261953830719, -0.5586127042770386, -0.5329633951187134, -0.507314145565033, -0.48166489601135254, -0.45601561665534973, -0.4303663372993469, -0.4047170877456665, -0.3790678381919861, -0.3534185588359833, -0.32776927947998047, -0.30212002992630005, -0.27647078037261963, -0.2508215010166168, -0.2251722365617752, -0.1995229721069336, -0.17387370765209198, -0.14822444319725037, -0.12257517874240875, -0.09692591428756714, -0.07127664983272552, -0.04562738537788391, -0.019978120923042297, 0.005671143531799316, 0.03132040798664093, 0.056969672441482544, 0.08261893689632416, 0.10826820135116577, 0.13391746580600739, 0.159566730260849, 0.1852159947156906, 0.21086525917053223, 0.23651452362537384, 0.26216378808021545, 0.28781306743621826, 0.3134623169898987, 0.3391115665435791, 0.3647608458995819, 0.3904101252555847, 0.41605937480926514, 0.44170862436294556, 0.46735790371894836, 0.49300718307495117, 0.5186564326286316, 0.544305682182312, 0.5699549913406372, 0.5956042408943176, 0.621253490447998, 0.6469027400016785, 0.6725519895553589, 0.6982012987136841, 0.7238505482673645, 0.7494997978210449, 0.7751491069793701, 0.8007983565330505, 0.826447606086731]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 14.0, 14.0, 33.0, 57.0, 113.0, 252.0, 673.0, 1964.0, 9694.0, 146721.0, 3978404.0, 46697.0, 6299.0, 1818.0, 719.0, 331.0, 175.0, 113.0, 58.0, 42.0, 18.0, 13.0, 12.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5094223022460938, -0.4875946044921875, -0.46576690673828125, -0.443939208984375, -0.42211151123046875, -0.4002838134765625, -0.37845611572265625, -0.35662841796875, -0.33480072021484375, -0.3129730224609375, -0.29114532470703125, -0.269317626953125, -0.24748992919921875, -0.2256622314453125, -0.20383453369140625, -0.1820068359375, -0.16017913818359375, -0.1383514404296875, -0.11652374267578125, -0.094696044921875, -0.07286834716796875, -0.0510406494140625, -0.02921295166015625, -0.00738525390625, 0.01444244384765625, 0.0362701416015625, 0.05809783935546875, 0.079925537109375, 0.10175323486328125, 0.1235809326171875, 0.14540863037109375, 0.167236328125, 0.18906402587890625, 0.2108917236328125, 0.23271942138671875, 0.254547119140625, 0.27637481689453125, 0.2982025146484375, 0.32003021240234375, 0.34185791015625, 0.36368560791015625, 0.3855133056640625, 0.40734100341796875, 0.429168701171875, 0.45099639892578125, 0.4728240966796875, 0.49465179443359375, 0.5164794921875, 0.5383071899414062, 0.5601348876953125, 0.5819625854492188, 0.603790283203125, 0.6256179809570312, 0.6474456787109375, 0.6692733764648438, 0.69110107421875, 0.7129287719726562, 0.7347564697265625, 0.7565841674804688, 0.778411865234375, 0.8002395629882812, 0.8220672607421875, 0.8438949584960938, 0.86572265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 4.0, 5.0, 10.0, 14.0, 22.0, 32.0, 49.0, 83.0, 100.0, 115.0, 141.0, 127.0, 98.0, 52.0, 45.0, 33.0, 17.0, 15.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03192138671875, -0.03061532974243164, -0.02930927276611328, -0.028003215789794922, -0.026697158813476562, -0.025391101837158203, -0.024085044860839844, -0.022778987884521484, -0.021472930908203125, -0.020166873931884766, -0.018860816955566406, -0.017554759979248047, -0.016248703002929688, -0.014942646026611328, -0.013636589050292969, -0.01233053207397461, -0.01102447509765625, -0.00971841812133789, -0.008412361145019531, -0.007106304168701172, -0.0058002471923828125, -0.004494190216064453, -0.0031881332397460938, -0.0018820762634277344, -0.000576019287109375, 0.0007300376892089844, 0.0020360946655273438, 0.003342151641845703, 0.0046482086181640625, 0.005954265594482422, 0.007260322570800781, 0.00856637954711914, 0.0098724365234375, 0.01117849349975586, 0.012484550476074219, 0.013790607452392578, 0.015096664428710938, 0.016402721405029297, 0.017708778381347656, 0.019014835357666016, 0.020320892333984375, 0.021626949310302734, 0.022933006286621094, 0.024239063262939453, 0.025545120239257812, 0.026851177215576172, 0.02815723419189453, 0.02946329116821289, 0.03076934814453125, 0.03207540512084961, 0.03338146209716797, 0.03468751907348633, 0.03599357604980469, 0.03729963302612305, 0.038605690002441406, 0.039911746978759766, 0.041217803955078125, 0.042523860931396484, 0.043829917907714844, 0.0451359748840332, 0.04644203186035156, 0.04774808883666992, 0.04905414581298828, 0.05036020278930664, 0.051666259765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 14.0, 20.0, 33.0, 42.0, 78.0, 104.0, 158.0, 284.0, 549.0, 1175.0, 2872.0, 8281.0, 32217.0, 197484.0, 3243902.0, 615722.0, 67908.0, 15114.0, 4719.0, 1777.0, 785.0, 407.0, 246.0, 134.0, 94.0, 44.0, 23.0, 30.0, 18.0, 10.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.274749755859375, -0.26580810546875, -0.256866455078125, -0.2479248046875, -0.238983154296875, -0.23004150390625, -0.221099853515625, -0.212158203125, -0.203216552734375, -0.19427490234375, -0.185333251953125, -0.1763916015625, -0.167449951171875, -0.15850830078125, -0.149566650390625, -0.140625, -0.131683349609375, -0.12274169921875, -0.113800048828125, -0.1048583984375, -0.095916748046875, -0.08697509765625, -0.078033447265625, -0.069091796875, -0.060150146484375, -0.05120849609375, -0.042266845703125, -0.0333251953125, -0.024383544921875, -0.01544189453125, -0.006500244140625, 0.00244140625, 0.011383056640625, 0.02032470703125, 0.029266357421875, 0.0382080078125, 0.047149658203125, 0.05609130859375, 0.065032958984375, 0.073974609375, 0.082916259765625, 0.09185791015625, 0.100799560546875, 0.1097412109375, 0.118682861328125, 0.12762451171875, 0.136566162109375, 0.1455078125, 0.154449462890625, 0.16339111328125, 0.172332763671875, 0.1812744140625, 0.190216064453125, 0.19915771484375, 0.208099365234375, 0.217041015625, 0.225982666015625, 0.23492431640625, 0.243865966796875, 0.2528076171875, 0.261749267578125, 0.27069091796875, 0.279632568359375, 0.28857421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 8.0, 10.0, 9.0, 25.0, 23.0, 30.0, 60.0, 107.0, 119.0, 186.0, 379.0, 1064.0, 1072.0, 367.0, 181.0, 127.0, 87.0, 57.0, 35.0, 27.0, 20.0, 10.0, 13.0, 12.0, 5.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.054131507873535156, -0.05238533020019531, -0.05063915252685547, -0.048892974853515625, -0.04714679718017578, -0.04540061950683594, -0.043654441833496094, -0.04190826416015625, -0.040162086486816406, -0.03841590881347656, -0.03666973114013672, -0.034923553466796875, -0.03317737579345703, -0.03143119812011719, -0.029685020446777344, -0.0279388427734375, -0.026192665100097656, -0.024446487426757812, -0.02270030975341797, -0.020954132080078125, -0.01920795440673828, -0.017461776733398438, -0.015715599060058594, -0.01396942138671875, -0.012223243713378906, -0.010477066040039062, -0.008730888366699219, -0.006984710693359375, -0.005238533020019531, -0.0034923553466796875, -0.0017461776733398438, 0.0, 0.0017461776733398438, 0.0034923553466796875, 0.005238533020019531, 0.006984710693359375, 0.008730888366699219, 0.010477066040039062, 0.012223243713378906, 0.01396942138671875, 0.015715599060058594, 0.017461776733398438, 0.01920795440673828, 0.020954132080078125, 0.02270030975341797, 0.024446487426757812, 0.026192665100097656, 0.0279388427734375, 0.029685020446777344, 0.03143119812011719, 0.03317737579345703, 0.034923553466796875, 0.03666973114013672, 0.03841590881347656, 0.040162086486816406, 0.04190826416015625, 0.043654441833496094, 0.04540061950683594, 0.04714679718017578, 0.048892974853515625, 0.05063915252685547, 0.05238533020019531, 0.054131507873535156, 0.055877685546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 27.0, 60.0, 160.0, 278.0, 278.0, 126.0, 45.0, 22.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46466049551963806, -0.4400393068790436, -0.4154181480407715, -0.390796959400177, -0.3661757707595825, -0.3415546119213104, -0.31693342328071594, -0.29231226444244385, -0.26769107580184937, -0.24306990206241608, -0.2184487283229828, -0.1938275396823883, -0.16920636594295502, -0.14458519220352173, -0.11996400356292725, -0.09534282982349396, -0.07072165608406067, -0.04610047861933708, -0.021479301154613495, 0.0031418800354003906, 0.02776305377483368, 0.05238422751426697, 0.07700541615486145, 0.10162658989429474, 0.12624776363372803, 0.15086893737316132, 0.1754901111125946, 0.2001112997531891, 0.22473247349262238, 0.24935364723205566, 0.27397483587265015, 0.29859602451324463, 0.32321715354919434, 0.3478383421897888, 0.3724595010280609, 0.3970806896686554, 0.4217018485069275, 0.446323037147522, 0.47094422578811646, 0.49556541442871094, 0.5201865434646606, 0.5448077321052551, 0.5694289207458496, 0.5940500497817993, 0.6186712384223938, 0.6432924270629883, 0.6679136157035828, 0.6925348043441772, 0.7171559929847717, 0.7417771816253662, 0.7663983702659607, 0.7910195589065552, 0.8156406879425049, 0.8402618765830994, 0.8648830652236938, 0.8895042538642883, 0.9141254425048828, 0.9387466311454773, 0.9633678197860718, 0.9879889488220215, 1.0126101970672607, 1.0372313261032104, 1.0618524551391602, 1.0864737033843994, 1.1110948324203491]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 12.0, 10.0, 13.0, 15.0, 30.0, 36.0, 27.0, 37.0, 40.0, 34.0, 59.0, 43.0, 50.0, 47.0, 59.0, 46.0, 47.0, 45.0, 52.0, 54.0, 47.0, 35.0, 26.0, 24.0, 28.0, 22.0, 15.0, 11.0, 9.0, 7.0, 7.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21724176406860352, -0.20990778505802155, -0.20257382094860077, -0.1952398419380188, -0.18790587782859802, -0.18057189881801605, -0.17323791980743408, -0.1659039556980133, -0.15856999158859253, -0.15123601257801056, -0.14390204846858978, -0.1365680694580078, -0.12923410534858704, -0.12190012633800507, -0.11456615477800369, -0.10723218321800232, -0.09989820420742035, -0.09256423264741898, -0.0852302610874176, -0.07789628207683563, -0.07056231796741486, -0.06322833895683289, -0.05589436739683151, -0.04856039583683014, -0.041226424276828766, -0.03389245271682739, -0.02655847929418087, -0.019224505871534348, -0.011890534311532974, -0.004556562751531601, 0.002777412533760071, 0.010111384093761444, 0.017445355653762817, 0.02477932721376419, 0.032113298773765564, 0.039447274059057236, 0.04678124561905861, 0.05411521717905998, 0.061449192464351654, 0.06878316402435303, 0.0761171355843544, 0.08345110714435577, 0.09078507870435715, 0.09811905026435852, 0.10545302927494049, 0.11278699338436127, 0.12012097239494324, 0.127454936504364, 0.13478891551494598, 0.14212289452552795, 0.14945685863494873, 0.1567908376455307, 0.16412480175495148, 0.17145878076553345, 0.17879274487495422, 0.1861267238855362, 0.19346070289611816, 0.20079468190670013, 0.2081286460161209, 0.21546262502670288, 0.22279658913612366, 0.23013056814670563, 0.2374645471572876, 0.24479851126670837, 0.25213247537612915]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 21.0, 27.0, 46.0, 72.0, 103.0, 194.0, 328.0, 602.0, 1051.0, 2283.0, 5206.0, 16183.0, 71798.0, 368521.0, 454566.0, 95551.0, 20430.0, 6194.0, 2545.0, 1206.0, 633.0, 393.0, 230.0, 129.0, 78.0, 41.0, 30.0, 19.0, 12.0, 12.0, 5.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.246826171875, -0.2391338348388672, -0.23144149780273438, -0.22374916076660156, -0.21605682373046875, -0.20836448669433594, -0.20067214965820312, -0.1929798126220703, -0.1852874755859375, -0.1775951385498047, -0.16990280151367188, -0.16221046447753906, -0.15451812744140625, -0.14682579040527344, -0.13913345336914062, -0.1314411163330078, -0.123748779296875, -0.11605644226074219, -0.10836410522460938, -0.10067176818847656, -0.09297943115234375, -0.08528709411621094, -0.07759475708007812, -0.06990242004394531, -0.0622100830078125, -0.05451774597167969, -0.046825408935546875, -0.03913307189941406, -0.03144073486328125, -0.023748397827148438, -0.016056060791015625, -0.008363723754882812, -0.00067138671875, 0.0070209503173828125, 0.014713287353515625, 0.022405624389648438, 0.03009796142578125, 0.03779029846191406, 0.045482635498046875, 0.05317497253417969, 0.0608673095703125, 0.06855964660644531, 0.07625198364257812, 0.08394432067871094, 0.09163665771484375, 0.09932899475097656, 0.10702133178710938, 0.11471366882324219, 0.122406005859375, 0.1300983428955078, 0.13779067993164062, 0.14548301696777344, 0.15317535400390625, 0.16086769104003906, 0.16856002807617188, 0.1762523651123047, 0.1839447021484375, 0.1916370391845703, 0.19932937622070312, 0.20702171325683594, 0.21471405029296875, 0.22240638732910156, 0.23009872436523438, 0.2377910614013672, 0.2454833984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 10.0, 28.0, 38.0, 63.0, 82.0, 118.0, 135.0, 130.0, 103.0, 90.0, 74.0, 35.0, 26.0, 15.0, 10.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0362548828125, -0.03481149673461914, -0.03336811065673828, -0.03192472457885742, -0.030481338500976562, -0.029037952423095703, -0.027594566345214844, -0.026151180267333984, -0.024707794189453125, -0.023264408111572266, -0.021821022033691406, -0.020377635955810547, -0.018934249877929688, -0.017490863800048828, -0.01604747772216797, -0.01460409164428711, -0.01316070556640625, -0.01171731948852539, -0.010273933410644531, -0.008830547332763672, -0.0073871612548828125, -0.005943775177001953, -0.004500389099121094, -0.0030570030212402344, -0.001613616943359375, -0.00017023086547851562, 0.0012731552124023438, 0.002716541290283203, 0.0041599273681640625, 0.005603313446044922, 0.007046699523925781, 0.00849008560180664, 0.0099334716796875, 0.01137685775756836, 0.012820243835449219, 0.014263629913330078, 0.015707015991210938, 0.017150402069091797, 0.018593788146972656, 0.020037174224853516, 0.021480560302734375, 0.022923946380615234, 0.024367332458496094, 0.025810718536376953, 0.027254104614257812, 0.028697490692138672, 0.03014087677001953, 0.03158426284790039, 0.03302764892578125, 0.03447103500366211, 0.03591442108154297, 0.03735780715942383, 0.03880119323730469, 0.04024457931518555, 0.041687965393066406, 0.043131351470947266, 0.044574737548828125, 0.046018123626708984, 0.047461509704589844, 0.0489048957824707, 0.05034828186035156, 0.05179166793823242, 0.05323505401611328, 0.05467844009399414, 0.056121826171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 12.0, 13.0, 16.0, 32.0, 34.0, 53.0, 89.0, 111.0, 142.0, 206.0, 392.0, 528.0, 1079.0, 2285.0, 7582.0, 35144.0, 185977.0, 563383.0, 200692.0, 37642.0, 7719.0, 2502.0, 1094.0, 632.0, 351.0, 256.0, 165.0, 99.0, 92.0, 51.0, 49.0, 31.0, 20.0, 21.0, 13.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.277099609375, -0.2688331604003906, -0.26056671142578125, -0.2523002624511719, -0.2440338134765625, -0.23576736450195312, -0.22750091552734375, -0.21923446655273438, -0.210968017578125, -0.20270156860351562, -0.19443511962890625, -0.18616867065429688, -0.1779022216796875, -0.16963577270507812, -0.16136932373046875, -0.15310287475585938, -0.14483642578125, -0.13656997680664062, -0.12830352783203125, -0.12003707885742188, -0.1117706298828125, -0.10350418090820312, -0.09523773193359375, -0.08697128295898438, -0.078704833984375, -0.07043838500976562, -0.06217193603515625, -0.053905487060546875, -0.0456390380859375, -0.037372589111328125, -0.02910614013671875, -0.020839691162109375, -0.0125732421875, -0.004306793212890625, 0.00395965576171875, 0.012226104736328125, 0.0204925537109375, 0.028759002685546875, 0.03702545166015625, 0.045291900634765625, 0.053558349609375, 0.061824798583984375, 0.07009124755859375, 0.07835769653320312, 0.0866241455078125, 0.09489059448242188, 0.10315704345703125, 0.11142349243164062, 0.11968994140625, 0.12795639038085938, 0.13622283935546875, 0.14448928833007812, 0.1527557373046875, 0.16102218627929688, 0.16928863525390625, 0.17755508422851562, 0.185821533203125, 0.19408798217773438, 0.20235443115234375, 0.21062088012695312, 0.2188873291015625, 0.22715377807617188, 0.23542022705078125, 0.24368667602539062, 0.251953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 6.0, 14.0, 14.0, 14.0, 11.0, 24.0, 28.0, 21.0, 29.0, 37.0, 27.0, 38.0, 41.0, 48.0, 40.0, 42.0, 36.0, 43.0, 43.0, 43.0, 49.0, 45.0, 35.0, 36.0, 29.0, 35.0, 24.0, 25.0, 32.0, 14.0, 16.0, 13.0, 10.0, 1.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1168212890625, -0.11263275146484375, -0.1084442138671875, -0.10425567626953125, -0.100067138671875, -0.09587860107421875, -0.0916900634765625, -0.08750152587890625, -0.08331298828125, -0.07912445068359375, -0.0749359130859375, -0.07074737548828125, -0.066558837890625, -0.06237030029296875, -0.0581817626953125, -0.05399322509765625, -0.0498046875, -0.04561614990234375, -0.0414276123046875, -0.03723907470703125, -0.033050537109375, -0.02886199951171875, -0.0246734619140625, -0.02048492431640625, -0.01629638671875, -0.01210784912109375, -0.0079193115234375, -0.00373077392578125, 0.000457763671875, 0.00464630126953125, 0.0088348388671875, 0.01302337646484375, 0.0172119140625, 0.02140045166015625, 0.0255889892578125, 0.02977752685546875, 0.033966064453125, 0.03815460205078125, 0.0423431396484375, 0.04653167724609375, 0.05072021484375, 0.05490875244140625, 0.0590972900390625, 0.06328582763671875, 0.067474365234375, 0.07166290283203125, 0.0758514404296875, 0.08003997802734375, 0.084228515625, 0.08841705322265625, 0.0926055908203125, 0.09679412841796875, 0.100982666015625, 0.10517120361328125, 0.1093597412109375, 0.11354827880859375, 0.11773681640625, 0.12192535400390625, 0.1261138916015625, 0.13030242919921875, 0.134490966796875, 0.13867950439453125, 0.1428680419921875, 0.14705657958984375, 0.1512451171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 10.0, 11.0, 16.0, 26.0, 56.0, 83.0, 90.0, 183.0, 253.0, 402.0, 615.0, 1064.0, 1795.0, 3153.0, 5992.0, 12668.0, 33084.0, 108619.0, 439013.0, 316686.0, 77593.0, 25128.0, 10346.0, 4946.0, 2700.0, 1514.0, 950.0, 554.0, 351.0, 257.0, 138.0, 79.0, 58.0, 46.0, 21.0, 17.0, 13.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.14820194244384766, -0.1441822052001953, -0.14016246795654297, -0.13614273071289062, -0.13212299346923828, -0.12810325622558594, -0.1240835189819336, -0.12006378173828125, -0.1160440444946289, -0.11202430725097656, -0.10800457000732422, -0.10398483276367188, -0.09996509552001953, -0.09594535827636719, -0.09192562103271484, -0.0879058837890625, -0.08388614654541016, -0.07986640930175781, -0.07584667205810547, -0.07182693481445312, -0.06780719757080078, -0.06378746032714844, -0.059767723083496094, -0.05574798583984375, -0.051728248596191406, -0.04770851135253906, -0.04368877410888672, -0.039669036865234375, -0.03564929962158203, -0.03162956237792969, -0.027609825134277344, -0.023590087890625, -0.019570350646972656, -0.015550613403320312, -0.011530876159667969, -0.007511138916015625, -0.0034914016723632812, 0.0005283355712890625, 0.004548072814941406, 0.00856781005859375, 0.012587547302246094, 0.016607284545898438, 0.02062702178955078, 0.024646759033203125, 0.02866649627685547, 0.03268623352050781, 0.036705970764160156, 0.0407257080078125, 0.044745445251464844, 0.04876518249511719, 0.05278491973876953, 0.056804656982421875, 0.06082439422607422, 0.06484413146972656, 0.0688638687133789, 0.07288360595703125, 0.0769033432006836, 0.08092308044433594, 0.08494281768798828, 0.08896255493164062, 0.09298229217529297, 0.09700202941894531, 0.10102176666259766, 0.10504150390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 12.0, 11.0, 15.0, 27.0, 28.0, 42.0, 49.0, 63.0, 79.0, 68.0, 104.0, 83.0, 86.0, 72.0, 61.0, 46.0, 35.0, 31.0, 22.0, 10.0, 9.0, 9.0, 5.0, 4.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.939338684082031e-05, -7.642991840839386e-05, -7.346644997596741e-05, -7.050298154354095e-05, -6.75395131111145e-05, -6.457604467868805e-05, -6.16125762462616e-05, -5.8649107813835144e-05, -5.568563938140869e-05, -5.272217094898224e-05, -4.9758702516555786e-05, -4.6795234084129333e-05, -4.383176565170288e-05, -4.086829721927643e-05, -3.7904828786849976e-05, -3.494136035442352e-05, -3.197789192199707e-05, -2.9014423489570618e-05, -2.6050955057144165e-05, -2.3087486624717712e-05, -2.012401819229126e-05, -1.7160549759864807e-05, -1.4197081327438354e-05, -1.1233612895011902e-05, -8.27014446258545e-06, -5.306676030158997e-06, -2.343207597732544e-06, 6.202608346939087e-07, 3.5837292671203613e-06, 6.547197699546814e-06, 9.510666131973267e-06, 1.247413456439972e-05, 1.5437602996826172e-05, 1.8401071429252625e-05, 2.1364539861679077e-05, 2.432800829410553e-05, 2.7291476726531982e-05, 3.0254945158958435e-05, 3.321841359138489e-05, 3.618188202381134e-05, 3.914535045623779e-05, 4.2108818888664246e-05, 4.50722873210907e-05, 4.803575575351715e-05, 5.0999224185943604e-05, 5.3962692618370056e-05, 5.692616105079651e-05, 5.988962948322296e-05, 6.285309791564941e-05, 6.581656634807587e-05, 6.878003478050232e-05, 7.174350321292877e-05, 7.470697164535522e-05, 7.767044007778168e-05, 8.063390851020813e-05, 8.359737694263458e-05, 8.656084537506104e-05, 8.952431380748749e-05, 9.248778223991394e-05, 9.545125067234039e-05, 9.841471910476685e-05, 0.0001013781875371933, 0.00010434165596961975, 0.0001073051244020462, 0.00011026859283447266]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 11.0, 5.0, 14.0, 16.0, 17.0, 34.0, 50.0, 93.0, 129.0, 254.0, 518.0, 1198.0, 3362.0, 11996.0, 78885.0, 745973.0, 177455.0, 20409.0, 4977.0, 1671.0, 689.0, 313.0, 147.0, 109.0, 61.0, 47.0, 27.0, 19.0, 19.0, 7.0, 8.0, 2.0, 3.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2371826171875, -0.2294483184814453, -0.22171401977539062, -0.21397972106933594, -0.20624542236328125, -0.19851112365722656, -0.19077682495117188, -0.1830425262451172, -0.1753082275390625, -0.1675739288330078, -0.15983963012695312, -0.15210533142089844, -0.14437103271484375, -0.13663673400878906, -0.12890243530273438, -0.12116813659667969, -0.113433837890625, -0.10569953918457031, -0.09796524047851562, -0.09023094177246094, -0.08249664306640625, -0.07476234436035156, -0.06702804565429688, -0.05929374694824219, -0.0515594482421875, -0.04382514953613281, -0.036090850830078125, -0.028356552124023438, -0.02062225341796875, -0.012887954711914062, -0.005153656005859375, 0.0025806427001953125, 0.01031494140625, 0.018049240112304688, 0.025783538818359375, 0.03351783752441406, 0.04125213623046875, 0.04898643493652344, 0.056720733642578125, 0.06445503234863281, 0.0721893310546875, 0.07992362976074219, 0.08765792846679688, 0.09539222717285156, 0.10312652587890625, 0.11086082458496094, 0.11859512329101562, 0.1263294219970703, 0.134063720703125, 0.1417980194091797, 0.14953231811523438, 0.15726661682128906, 0.16500091552734375, 0.17273521423339844, 0.18046951293945312, 0.1882038116455078, 0.1959381103515625, 0.2036724090576172, 0.21140670776367188, 0.21914100646972656, 0.22687530517578125, 0.23460960388183594, 0.24234390258789062, 0.2500782012939453, 0.2578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 10.0, 11.0, 19.0, 20.0, 22.0, 24.0, 26.0, 31.0, 47.0, 74.0, 118.0, 127.0, 109.0, 81.0, 62.0, 44.0, 43.0, 24.0, 28.0, 9.0, 10.0, 14.0, 13.0, 5.0, 9.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09698486328125, -0.09393882751464844, -0.09089279174804688, -0.08784675598144531, -0.08480072021484375, -0.08175468444824219, -0.07870864868164062, -0.07566261291503906, -0.0726165771484375, -0.06957054138183594, -0.06652450561523438, -0.06347846984863281, -0.06043243408203125, -0.05738639831542969, -0.054340362548828125, -0.05129432678222656, -0.048248291015625, -0.04520225524902344, -0.042156219482421875, -0.03911018371582031, -0.03606414794921875, -0.03301811218261719, -0.029972076416015625, -0.026926040649414062, -0.0238800048828125, -0.020833969116210938, -0.017787933349609375, -0.014741897583007812, -0.01169586181640625, -0.008649826049804688, -0.005603790283203125, -0.0025577545166015625, 0.00048828125, 0.0035343170166015625, 0.006580352783203125, 0.009626388549804688, 0.01267242431640625, 0.015718460083007812, 0.018764495849609375, 0.021810531616210938, 0.0248565673828125, 0.027902603149414062, 0.030948638916015625, 0.03399467468261719, 0.03704071044921875, 0.04008674621582031, 0.043132781982421875, 0.04617881774902344, 0.049224853515625, 0.05227088928222656, 0.055316925048828125, 0.05836296081542969, 0.06140899658203125, 0.06445503234863281, 0.06750106811523438, 0.07054710388183594, 0.0735931396484375, 0.07663917541503906, 0.07968521118164062, 0.08273124694824219, 0.08577728271484375, 0.08882331848144531, 0.09186935424804688, 0.09491539001464844, 0.09796142578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 13.0, 20.0, 76.0, 204.0, 299.0, 247.0, 97.0, 32.0, 10.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6724709272384644, -1.5774142742156982, -1.4823575019836426, -1.3873008489608765, -1.2922441959381104, -1.1971874237060547, -1.1021307706832886, -1.0070741176605225, -0.9120173454284668, -0.8169606328010559, -0.721903920173645, -0.6268472671508789, -0.531790554523468, -0.43673384189605713, -0.341677188873291, -0.24662047624588013, -0.15156376361846924, -0.05650706589221954, 0.03854963183403015, 0.13360631465911865, 0.22866302728652954, 0.32371973991394043, 0.41877639293670654, 0.5138331055641174, 0.6088898181915283, 0.7039465308189392, 0.7990032434463501, 0.8940598964691162, 0.9891166090965271, 1.084173321723938, 1.179229974746704, 1.2742867469787598, 1.3693432807922363, 1.4643999338150024, 1.559456706047058, 1.6545133590698242, 1.7495701313018799, 1.844626784324646, 1.939683437347412, 2.0347402095794678, 2.1297969818115234, 2.224853754043579, 2.3199102878570557, 2.4149670600891113, 2.510023832321167, 2.6050806045532227, 2.700137138366699, 2.795193910598755, 2.8902504444122314, 2.985307216644287, 3.0803637504577637, 3.1754205226898193, 3.270477294921875, 3.3655338287353516, 3.4605906009674072, 3.555647373199463, 3.6507039070129395, 3.745760679244995, 3.8408172130584717, 3.9358739852905273, 4.030930519104004, 4.125987529754639, 4.221044063568115, 4.316100597381592, 4.411157608032227]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 2.0, 12.0, 5.0, 8.0, 9.0, 10.0, 14.0, 12.0, 17.0, 21.0, 24.0, 26.0, 27.0, 40.0, 47.0, 30.0, 44.0, 36.0, 31.0, 46.0, 37.0, 37.0, 34.0, 36.0, 43.0, 40.0, 40.0, 41.0, 34.0, 41.0, 21.0, 27.0, 20.0, 10.0, 8.0, 10.0, 8.0, 13.0, 7.0, 5.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8363328576087952, -0.8103107213973999, -0.7842886447906494, -0.7582665085792542, -0.7322444319725037, -0.7062222957611084, -0.6802002191543579, -0.6541780829429626, -0.6281559467315674, -0.6021338105201721, -0.5761117339134216, -0.5500895977020264, -0.5240675210952759, -0.4980453848838806, -0.47202327847480774, -0.44600117206573486, -0.4199790954589844, -0.3939569890499115, -0.3679348826408386, -0.34191274642944336, -0.31589066982269287, -0.2898685336112976, -0.26384642720222473, -0.23782432079315186, -0.21180221438407898, -0.1857801079750061, -0.15975800156593323, -0.13373588025569916, -0.10771377384662628, -0.0816916674375534, -0.055669546127319336, -0.02964743971824646, -0.0036252737045288086, 0.022396836429834366, 0.04841894656419754, 0.07444106042385101, 0.10046316683292389, 0.12648527324199677, 0.15250739455223083, 0.1785295009613037, 0.2045516073703766, 0.23057371377944946, 0.25659582018852234, 0.2826179265975952, 0.3086400628089905, 0.33466213941574097, 0.36068427562713623, 0.3867063820362091, 0.412728488445282, 0.43875059485435486, 0.46477270126342773, 0.490794837474823, 0.5168169140815735, 0.5428390502929688, 0.5688611268997192, 0.5948832631111145, 0.6209053993225098, 0.646927535533905, 0.6729496121406555, 0.6989717483520508, 0.7249938249588013, 0.7510159611701965, 0.7770380973815918, 0.8030601739883423, 0.8290822505950928]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 16.0, 16.0, 51.0, 95.0, 196.0, 427.0, 1072.0, 3697.0, 20430.0, 383433.0, 3720993.0, 53244.0, 7164.0, 1992.0, 725.0, 329.0, 161.0, 89.0, 44.0, 27.0, 27.0, 14.0, 12.0, 4.0, 3.0, 5.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.3125267028808594, -0.29961395263671875, -0.2867012023925781, -0.2737884521484375, -0.2608757019042969, -0.24796295166015625, -0.23505020141601562, -0.222137451171875, -0.20922470092773438, -0.19631195068359375, -0.18339920043945312, -0.1704864501953125, -0.15757369995117188, -0.14466094970703125, -0.13174819946289062, -0.11883544921875, -0.10592269897460938, -0.09300994873046875, -0.08009719848632812, -0.0671844482421875, -0.054271697998046875, -0.04135894775390625, -0.028446197509765625, -0.015533447265625, -0.002620697021484375, 0.01029205322265625, 0.023204803466796875, 0.0361175537109375, 0.049030303955078125, 0.06194305419921875, 0.07485580444335938, 0.0877685546875, 0.10068130493164062, 0.11359405517578125, 0.12650680541992188, 0.1394195556640625, 0.15233230590820312, 0.16524505615234375, 0.17815780639648438, 0.191070556640625, 0.20398330688476562, 0.21689605712890625, 0.22980880737304688, 0.2427215576171875, 0.2556343078613281, 0.26854705810546875, 0.2814598083496094, 0.29437255859375, 0.3072853088378906, 0.32019805908203125, 0.3331108093261719, 0.3460235595703125, 0.3589363098144531, 0.37184906005859375, 0.3847618103027344, 0.397674560546875, 0.4105873107910156, 0.42350006103515625, 0.4364128112792969, 0.4493255615234375, 0.4622383117675781, 0.47515106201171875, 0.4880638122558594, 0.5009765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 8.0, 32.0, 26.0, 37.0, 66.0, 79.0, 104.0, 119.0, 104.0, 104.0, 88.0, 66.0, 46.0, 43.0, 26.0, 12.0, 10.0, 5.0, 5.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042327880859375, -0.04071760177612305, -0.039107322692871094, -0.03749704360961914, -0.03588676452636719, -0.034276485443115234, -0.03266620635986328, -0.031055927276611328, -0.029445648193359375, -0.027835369110107422, -0.02622509002685547, -0.024614810943603516, -0.023004531860351562, -0.02139425277709961, -0.019783973693847656, -0.018173694610595703, -0.01656341552734375, -0.014953136444091797, -0.013342857360839844, -0.01173257827758789, -0.010122299194335938, -0.008512020111083984, -0.006901741027832031, -0.005291461944580078, -0.003681182861328125, -0.002070903778076172, -0.00046062469482421875, 0.0011496543884277344, 0.0027599334716796875, 0.004370212554931641, 0.005980491638183594, 0.007590770721435547, 0.0092010498046875, 0.010811328887939453, 0.012421607971191406, 0.01403188705444336, 0.015642166137695312, 0.017252445220947266, 0.01886272430419922, 0.020473003387451172, 0.022083282470703125, 0.023693561553955078, 0.02530384063720703, 0.026914119720458984, 0.028524398803710938, 0.03013467788696289, 0.031744956970214844, 0.0333552360534668, 0.03496551513671875, 0.0365757942199707, 0.038186073303222656, 0.03979635238647461, 0.04140663146972656, 0.043016910552978516, 0.04462718963623047, 0.04623746871948242, 0.047847747802734375, 0.04945802688598633, 0.05106830596923828, 0.052678585052490234, 0.05428886413574219, 0.05589914321899414, 0.057509422302246094, 0.05911970138549805, 0.06072998046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 15.0, 25.0, 31.0, 47.0, 84.0, 117.0, 176.0, 382.0, 668.0, 1420.0, 3171.0, 7973.0, 23862.0, 96491.0, 664223.0, 3081002.0, 243107.0, 48746.0, 13811.0, 4756.0, 2014.0, 881.0, 511.0, 253.0, 142.0, 102.0, 84.0, 36.0, 27.0, 30.0, 17.0, 16.0, 8.0, 13.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.203125, -0.1970195770263672, -0.19091415405273438, -0.18480873107910156, -0.17870330810546875, -0.17259788513183594, -0.16649246215820312, -0.1603870391845703, -0.1542816162109375, -0.1481761932373047, -0.14207077026367188, -0.13596534729003906, -0.12985992431640625, -0.12375450134277344, -0.11764907836914062, -0.11154365539550781, -0.105438232421875, -0.09933280944824219, -0.09322738647460938, -0.08712196350097656, -0.08101654052734375, -0.07491111755371094, -0.06880569458007812, -0.06270027160644531, -0.0565948486328125, -0.05048942565917969, -0.044384002685546875, -0.03827857971191406, -0.03217315673828125, -0.026067733764648438, -0.019962310791015625, -0.013856887817382812, -0.00775146484375, -0.0016460418701171875, 0.004459381103515625, 0.010564804077148438, 0.01667022705078125, 0.022775650024414062, 0.028881072998046875, 0.03498649597167969, 0.0410919189453125, 0.04719734191894531, 0.053302764892578125, 0.05940818786621094, 0.06551361083984375, 0.07161903381347656, 0.07772445678710938, 0.08382987976074219, 0.089935302734375, 0.09604072570800781, 0.10214614868164062, 0.10825157165527344, 0.11435699462890625, 0.12046241760253906, 0.12656784057617188, 0.1326732635498047, 0.1387786865234375, 0.1448841094970703, 0.15098953247070312, 0.15709495544433594, 0.16320037841796875, 0.16930580139160156, 0.17541122436523438, 0.1815166473388672, 0.1876220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 8.0, 7.0, 8.0, 18.0, 18.0, 29.0, 38.0, 52.0, 111.0, 188.0, 450.0, 1563.0, 870.0, 331.0, 140.0, 80.0, 65.0, 40.0, 16.0, 16.0, 14.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04195976257324219, -0.039730072021484375, -0.03750038146972656, -0.03527069091796875, -0.03304100036621094, -0.030811309814453125, -0.028581619262695312, -0.0263519287109375, -0.024122238159179688, -0.021892547607421875, -0.019662857055664062, -0.01743316650390625, -0.015203475952148438, -0.012973785400390625, -0.010744094848632812, -0.008514404296875, -0.0062847137451171875, -0.004055023193359375, -0.0018253326416015625, 0.00040435791015625, 0.0026340484619140625, 0.004863739013671875, 0.0070934295654296875, 0.0093231201171875, 0.011552810668945312, 0.013782501220703125, 0.016012191772460938, 0.01824188232421875, 0.020471572875976562, 0.022701263427734375, 0.024930953979492188, 0.02716064453125, 0.029390335083007812, 0.031620025634765625, 0.03384971618652344, 0.03607940673828125, 0.03830909729003906, 0.040538787841796875, 0.04276847839355469, 0.0449981689453125, 0.04722785949707031, 0.049457550048828125, 0.05168724060058594, 0.05391693115234375, 0.05614662170410156, 0.058376312255859375, 0.06060600280761719, 0.062835693359375, 0.06506538391113281, 0.06729507446289062, 0.06952476501464844, 0.07175445556640625, 0.07398414611816406, 0.07621383666992188, 0.07844352722167969, 0.0806732177734375, 0.08290290832519531, 0.08513259887695312, 0.08736228942871094, 0.08959197998046875, 0.09182167053222656, 0.09405136108398438, 0.09628105163574219, 0.0985107421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 12.0, 32.0, 67.0, 152.0, 186.0, 271.0, 164.0, 79.0, 33.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.0670428276062012, -1.0469731092453003, -1.0269032716751099, -1.006833553314209, -0.9867637157440186, -0.9666939377784729, -0.9466241598129272, -0.9265544414520264, -0.9064846038818359, -0.8864148259162903, -0.8663450479507446, -0.846275269985199, -0.8262054920196533, -0.8061357140541077, -0.786065936088562, -0.7659962177276611, -0.7459264397621155, -0.7258566617965698, -0.7057868838310242, -0.6857171058654785, -0.6656473278999329, -0.6455775499343872, -0.6255077719688416, -0.6054379940032959, -0.585368275642395, -0.5652984976768494, -0.5452287197113037, -0.5251589417457581, -0.5050891637802124, -0.48501938581466675, -0.4649496376514435, -0.4448798596858978, -0.4248100519180298, -0.40474027395248413, -0.3846704959869385, -0.3646007180213928, -0.34453094005584717, -0.3244611620903015, -0.30439141392707825, -0.2843216359615326, -0.2642518877983093, -0.24418210983276367, -0.22411233186721802, -0.20404256880283356, -0.1839727908372879, -0.16390301287174225, -0.1438332498073578, -0.12376347184181213, -0.10369367897510529, -0.08362390100955963, -0.06355413049459457, -0.04348435625433922, -0.023414582014083862, -0.003344804048538208, 0.01672496646642685, 0.03679473698139191, 0.05686451494693756, 0.07693429291248322, 0.09700406342744827, 0.11707383394241333, 0.13714361190795898, 0.15721338987350464, 0.1772831678390503, 0.19735293090343475, 0.2174227088689804]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 11.0, 7.0, 11.0, 6.0, 16.0, 15.0, 21.0, 16.0, 16.0, 26.0, 23.0, 22.0, 26.0, 33.0, 42.0, 36.0, 40.0, 28.0, 36.0, 37.0, 42.0, 40.0, 40.0, 30.0, 28.0, 43.0, 31.0, 35.0, 28.0, 40.0, 19.0, 17.0, 18.0, 20.0, 16.0, 9.0, 17.0, 11.0, 7.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14853399991989136, -0.14352990686893463, -0.1385258138179779, -0.13352172076702118, -0.12851762771606445, -0.12351353466510773, -0.118509441614151, -0.11350534856319427, -0.10850125551223755, -0.10349716246128082, -0.0984930694103241, -0.09348897635936737, -0.08848488330841064, -0.08348079025745392, -0.07847669720649719, -0.07347260415554047, -0.06846851110458374, -0.06346441805362701, -0.05846032500267029, -0.05345623195171356, -0.048452138900756836, -0.04344804584980011, -0.038443952798843384, -0.03343985974788666, -0.02843576669692993, -0.023431673645973206, -0.01842758059501648, -0.013423487544059753, -0.008419394493103027, -0.0034153014421463013, 0.0015887916088104248, 0.006592884659767151, 0.011596977710723877, 0.016601070761680603, 0.02160516381263733, 0.026609256863594055, 0.03161334991455078, 0.03661744296550751, 0.04162153601646423, 0.04662562906742096, 0.051629722118377686, 0.05663381516933441, 0.06163790822029114, 0.06664200127124786, 0.07164609432220459, 0.07665018737316132, 0.08165428042411804, 0.08665837347507477, 0.0916624665260315, 0.09666655957698822, 0.10167065262794495, 0.10667474567890167, 0.1116788387298584, 0.11668293178081512, 0.12168702483177185, 0.12669111788272858, 0.1316952109336853, 0.13669930398464203, 0.14170339703559875, 0.14670749008655548, 0.1517115831375122, 0.15671567618846893, 0.16171976923942566, 0.16672386229038239, 0.1717279553413391]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 10.0, 13.0, 21.0, 27.0, 20.0, 48.0, 78.0, 117.0, 166.0, 256.0, 411.0, 741.0, 1273.0, 2680.0, 5710.0, 13919.0, 36477.0, 100504.0, 264895.0, 358574.0, 164119.0, 59608.0, 22061.0, 8823.0, 3760.0, 1742.0, 991.0, 535.0, 357.0, 210.0, 139.0, 82.0, 52.0, 44.0, 24.0, 17.0, 13.0, 5.0, 5.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.13818359375, -0.1338977813720703, -0.12961196899414062, -0.12532615661621094, -0.12104034423828125, -0.11675453186035156, -0.11246871948242188, -0.10818290710449219, -0.1038970947265625, -0.09961128234863281, -0.09532546997070312, -0.09103965759277344, -0.08675384521484375, -0.08246803283691406, -0.07818222045898438, -0.07389640808105469, -0.069610595703125, -0.06532478332519531, -0.061038970947265625, -0.05675315856933594, -0.05246734619140625, -0.04818153381347656, -0.043895721435546875, -0.03960990905761719, -0.0353240966796875, -0.031038284301757812, -0.026752471923828125, -0.022466659545898438, -0.01818084716796875, -0.013895034790039062, -0.009609222412109375, -0.0053234100341796875, -0.00103759765625, 0.0032482147216796875, 0.007534027099609375, 0.011819839477539062, 0.01610565185546875, 0.020391464233398438, 0.024677276611328125, 0.028963088989257812, 0.0332489013671875, 0.03753471374511719, 0.041820526123046875, 0.04610633850097656, 0.05039215087890625, 0.05467796325683594, 0.058963775634765625, 0.06324958801269531, 0.067535400390625, 0.07182121276855469, 0.07610702514648438, 0.08039283752441406, 0.08467864990234375, 0.08896446228027344, 0.09325027465820312, 0.09753608703613281, 0.1018218994140625, 0.10610771179199219, 0.11039352416992188, 0.11467933654785156, 0.11896514892578125, 0.12325096130371094, 0.12753677368164062, 0.1318225860595703, 0.1361083984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 27.0, 31.0, 36.0, 64.0, 75.0, 87.0, 102.0, 104.0, 91.0, 105.0, 75.0, 62.0, 42.0, 32.0, 14.0, 16.0, 12.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.040711402893066406, -0.03906440734863281, -0.03741741180419922, -0.035770416259765625, -0.03412342071533203, -0.03247642517089844, -0.030829429626464844, -0.02918243408203125, -0.027535438537597656, -0.025888442993164062, -0.02424144744873047, -0.022594451904296875, -0.02094745635986328, -0.019300460815429688, -0.017653465270996094, -0.0160064697265625, -0.014359474182128906, -0.012712478637695312, -0.011065483093261719, -0.009418487548828125, -0.007771492004394531, -0.0061244964599609375, -0.004477500915527344, -0.00283050537109375, -0.0011835098266601562, 0.0004634857177734375, 0.0021104812622070312, 0.003757476806640625, 0.005404472351074219, 0.0070514678955078125, 0.008698463439941406, 0.010345458984375, 0.011992454528808594, 0.013639450073242188, 0.015286445617675781, 0.016933441162109375, 0.01858043670654297, 0.020227432250976562, 0.021874427795410156, 0.02352142333984375, 0.025168418884277344, 0.026815414428710938, 0.02846240997314453, 0.030109405517578125, 0.03175640106201172, 0.03340339660644531, 0.035050392150878906, 0.0366973876953125, 0.038344383239746094, 0.03999137878417969, 0.04163837432861328, 0.043285369873046875, 0.04493236541748047, 0.04657936096191406, 0.048226356506347656, 0.04987335205078125, 0.051520347595214844, 0.05316734313964844, 0.05481433868408203, 0.056461334228515625, 0.05810832977294922, 0.05975532531738281, 0.061402320861816406, 0.06304931640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 11.0, 16.0, 18.0, 28.0, 45.0, 66.0, 88.0, 133.0, 187.0, 289.0, 433.0, 689.0, 1326.0, 2681.0, 7499.0, 29396.0, 126525.0, 417563.0, 338172.0, 90917.0, 21400.0, 5962.0, 2089.0, 1130.0, 621.0, 397.0, 270.0, 180.0, 106.0, 88.0, 55.0, 42.0, 31.0, 20.0, 19.0, 16.0, 6.0, 4.0, 2.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1881103515625, -0.1823902130126953, -0.17667007446289062, -0.17094993591308594, -0.16522979736328125, -0.15950965881347656, -0.15378952026367188, -0.1480693817138672, -0.1423492431640625, -0.1366291046142578, -0.13090896606445312, -0.12518882751464844, -0.11946868896484375, -0.11374855041503906, -0.10802841186523438, -0.10230827331542969, -0.096588134765625, -0.09086799621582031, -0.08514785766601562, -0.07942771911621094, -0.07370758056640625, -0.06798744201660156, -0.062267303466796875, -0.05654716491699219, -0.0508270263671875, -0.04510688781738281, -0.039386749267578125, -0.03366661071777344, -0.02794647216796875, -0.022226333618164062, -0.016506195068359375, -0.010786056518554688, -0.00506591796875, 0.0006542205810546875, 0.006374359130859375, 0.012094497680664062, 0.01781463623046875, 0.023534774780273438, 0.029254913330078125, 0.03497505187988281, 0.0406951904296875, 0.04641532897949219, 0.052135467529296875, 0.05785560607910156, 0.06357574462890625, 0.06929588317871094, 0.07501602172851562, 0.08073616027832031, 0.086456298828125, 0.09217643737792969, 0.09789657592773438, 0.10361671447753906, 0.10933685302734375, 0.11505699157714844, 0.12077713012695312, 0.1264972686767578, 0.1322174072265625, 0.1379375457763672, 0.14365768432617188, 0.14937782287597656, 0.15509796142578125, 0.16081809997558594, 0.16653823852539062, 0.1722583770751953, 0.177978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 9.0, 7.0, 9.0, 11.0, 22.0, 22.0, 23.0, 29.0, 31.0, 35.0, 47.0, 52.0, 47.0, 51.0, 55.0, 68.0, 54.0, 49.0, 48.0, 40.0, 43.0, 49.0, 37.0, 23.0, 25.0, 20.0, 29.0, 18.0, 15.0, 17.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20166015625, -0.19617843627929688, -0.19069671630859375, -0.18521499633789062, -0.1797332763671875, -0.17425155639648438, -0.16876983642578125, -0.16328811645507812, -0.157806396484375, -0.15232467651367188, -0.14684295654296875, -0.14136123657226562, -0.1358795166015625, -0.13039779663085938, -0.12491607666015625, -0.11943435668945312, -0.11395263671875, -0.10847091674804688, -0.10298919677734375, -0.09750747680664062, -0.0920257568359375, -0.08654403686523438, -0.08106231689453125, -0.07558059692382812, -0.070098876953125, -0.06461715698242188, -0.05913543701171875, -0.053653717041015625, -0.0481719970703125, -0.042690277099609375, -0.03720855712890625, -0.031726837158203125, -0.0262451171875, -0.020763397216796875, -0.01528167724609375, -0.009799957275390625, -0.0043182373046875, 0.001163482666015625, 0.00664520263671875, 0.012126922607421875, 0.017608642578125, 0.023090362548828125, 0.02857208251953125, 0.034053802490234375, 0.0395355224609375, 0.045017242431640625, 0.05049896240234375, 0.055980682373046875, 0.06146240234375, 0.06694412231445312, 0.07242584228515625, 0.07790756225585938, 0.0833892822265625, 0.08887100219726562, 0.09435272216796875, 0.09983444213867188, 0.105316162109375, 0.11079788208007812, 0.11627960205078125, 0.12176132202148438, 0.1272430419921875, 0.13272476196289062, 0.13820648193359375, 0.14368820190429688, 0.149169921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 13.0, 26.0, 30.0, 34.0, 50.0, 75.0, 112.0, 193.0, 305.0, 556.0, 1117.0, 2218.0, 5114.0, 13822.0, 42803.0, 174779.0, 525355.0, 206670.0, 49318.0, 15289.0, 5687.0, 2306.0, 1109.0, 596.0, 356.0, 197.0, 126.0, 73.0, 55.0, 46.0, 21.0, 24.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.1038818359375, -0.10103988647460938, -0.09819793701171875, -0.09535598754882812, -0.0925140380859375, -0.08967208862304688, -0.08683013916015625, -0.08398818969726562, -0.081146240234375, -0.07830429077148438, -0.07546234130859375, -0.07262039184570312, -0.0697784423828125, -0.06693649291992188, -0.06409454345703125, -0.061252593994140625, -0.05841064453125, -0.055568695068359375, -0.05272674560546875, -0.049884796142578125, -0.0470428466796875, -0.044200897216796875, -0.04135894775390625, -0.038516998291015625, -0.035675048828125, -0.032833099365234375, -0.02999114990234375, -0.027149200439453125, -0.0243072509765625, -0.021465301513671875, -0.01862335205078125, -0.015781402587890625, -0.012939453125, -0.010097503662109375, -0.00725555419921875, -0.004413604736328125, -0.0015716552734375, 0.001270294189453125, 0.00411224365234375, 0.006954193115234375, 0.009796142578125, 0.012638092041015625, 0.01548004150390625, 0.018321990966796875, 0.0211639404296875, 0.024005889892578125, 0.02684783935546875, 0.029689788818359375, 0.03253173828125, 0.035373687744140625, 0.03821563720703125, 0.041057586669921875, 0.0438995361328125, 0.046741485595703125, 0.04958343505859375, 0.052425384521484375, 0.055267333984375, 0.058109283447265625, 0.06095123291015625, 0.06379318237304688, 0.0666351318359375, 0.06947708129882812, 0.07231903076171875, 0.07516098022460938, 0.0780029296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 7.0, 10.0, 16.0, 16.0, 41.0, 59.0, 69.0, 81.0, 104.0, 106.0, 105.0, 90.0, 82.0, 60.0, 46.0, 26.0, 25.0, 16.0, 17.0, 6.0, 3.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.512901306152344e-05, -9.159371256828308e-05, -8.805841207504272e-05, -8.452311158180237e-05, -8.098781108856201e-05, -7.745251059532166e-05, -7.39172101020813e-05, -7.038190960884094e-05, -6.684660911560059e-05, -6.331130862236023e-05, -5.977600812911987e-05, -5.6240707635879517e-05, -5.270540714263916e-05, -4.9170106649398804e-05, -4.563480615615845e-05, -4.209950566291809e-05, -3.8564205169677734e-05, -3.502890467643738e-05, -3.149360418319702e-05, -2.7958303689956665e-05, -2.442300319671631e-05, -2.0887702703475952e-05, -1.7352402210235596e-05, -1.381710171699524e-05, -1.0281801223754883e-05, -6.746500730514526e-06, -3.21120023727417e-06, 3.241002559661865e-07, 3.859400749206543e-06, 7.394701242446899e-06, 1.0930001735687256e-05, 1.4465302228927612e-05, 1.800060272216797e-05, 2.1535903215408325e-05, 2.507120370864868e-05, 2.8606504201889038e-05, 3.2141804695129395e-05, 3.567710518836975e-05, 3.921240568161011e-05, 4.2747706174850464e-05, 4.628300666809082e-05, 4.981830716133118e-05, 5.335360765457153e-05, 5.688890814781189e-05, 6.0424208641052246e-05, 6.39595091342926e-05, 6.749480962753296e-05, 7.103011012077332e-05, 7.456541061401367e-05, 7.810071110725403e-05, 8.163601160049438e-05, 8.517131209373474e-05, 8.87066125869751e-05, 9.224191308021545e-05, 9.577721357345581e-05, 9.931251406669617e-05, 0.00010284781455993652, 0.00010638311505317688, 0.00010991841554641724, 0.00011345371603965759, 0.00011698901653289795, 0.0001205243170261383, 0.00012405961751937866, 0.00012759491801261902, 0.00013113021850585938]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 9.0, 13.0, 16.0, 27.0, 46.0, 50.0, 77.0, 96.0, 159.0, 266.0, 556.0, 1032.0, 2601.0, 7397.0, 29020.0, 159586.0, 658606.0, 149375.0, 27313.0, 7423.0, 2547.0, 1069.0, 464.0, 312.0, 165.0, 101.0, 64.0, 39.0, 32.0, 19.0, 21.0, 22.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09288597106933594, -0.08909225463867188, -0.08529853820800781, -0.08150482177734375, -0.07771110534667969, -0.07391738891601562, -0.07012367248535156, -0.0663299560546875, -0.06253623962402344, -0.058742523193359375, -0.05494880676269531, -0.05115509033203125, -0.04736137390136719, -0.043567657470703125, -0.03977394104003906, -0.035980224609375, -0.03218650817871094, -0.028392791748046875, -0.024599075317382812, -0.02080535888671875, -0.017011642456054688, -0.013217926025390625, -0.009424209594726562, -0.0056304931640625, -0.0018367767333984375, 0.001956939697265625, 0.0057506561279296875, 0.00954437255859375, 0.013338088989257812, 0.017131805419921875, 0.020925521850585938, 0.02471923828125, 0.028512954711914062, 0.032306671142578125, 0.03610038757324219, 0.03989410400390625, 0.04368782043457031, 0.047481536865234375, 0.05127525329589844, 0.0550689697265625, 0.05886268615722656, 0.06265640258789062, 0.06645011901855469, 0.07024383544921875, 0.07403755187988281, 0.07783126831054688, 0.08162498474121094, 0.085418701171875, 0.08921241760253906, 0.09300613403320312, 0.09679985046386719, 0.10059356689453125, 0.10438728332519531, 0.10818099975585938, 0.11197471618652344, 0.1157684326171875, 0.11956214904785156, 0.12335586547851562, 0.1271495819091797, 0.13094329833984375, 0.1347370147705078, 0.13853073120117188, 0.14232444763183594, 0.1461181640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 11.0, 13.0, 15.0, 23.0, 29.0, 49.0, 58.0, 71.0, 87.0, 101.0, 88.0, 86.0, 69.0, 68.0, 58.0, 34.0, 22.0, 19.0, 15.0, 17.0, 7.0, 3.0, 1.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.07526493072509766, -0.07307624816894531, -0.07088756561279297, -0.06869888305664062, -0.06651020050048828, -0.06432151794433594, -0.062132835388183594, -0.05994415283203125, -0.057755470275878906, -0.05556678771972656, -0.05337810516357422, -0.051189422607421875, -0.04900074005126953, -0.04681205749511719, -0.044623374938964844, -0.0424346923828125, -0.040246009826660156, -0.03805732727050781, -0.03586864471435547, -0.033679962158203125, -0.03149127960205078, -0.029302597045898438, -0.027113914489746094, -0.02492523193359375, -0.022736549377441406, -0.020547866821289062, -0.01835918426513672, -0.016170501708984375, -0.013981819152832031, -0.011793136596679688, -0.009604454040527344, -0.007415771484375, -0.005227088928222656, -0.0030384063720703125, -0.0008497238159179688, 0.001338958740234375, 0.0035276412963867188, 0.0057163238525390625, 0.007905006408691406, 0.01009368896484375, 0.012282371520996094, 0.014471054077148438, 0.01665973663330078, 0.018848419189453125, 0.02103710174560547, 0.023225784301757812, 0.025414466857910156, 0.0276031494140625, 0.029791831970214844, 0.03198051452636719, 0.03416919708251953, 0.036357879638671875, 0.03854656219482422, 0.04073524475097656, 0.042923927307128906, 0.04511260986328125, 0.047301292419433594, 0.04948997497558594, 0.05167865753173828, 0.053867340087890625, 0.05605602264404297, 0.05824470520019531, 0.060433387756347656, 0.0626220703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 15.0, 21.0, 52.0, 110.0, 158.0, 146.0, 140.0, 130.0, 112.0, 44.0, 35.0, 20.0, 9.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.777843713760376, -0.7365291118621826, -0.6952145099639893, -0.6538999676704407, -0.6125853657722473, -0.571270763874054, -0.5299562215805054, -0.488641619682312, -0.44732701778411865, -0.4060124158859253, -0.3646978437900543, -0.32338327169418335, -0.28206866979599, -0.24075408279895782, -0.19943949580192566, -0.1581249237060547, -0.11681032180786133, -0.07549573481082916, -0.034181147813797, 0.0071334391832351685, 0.048448026180267334, 0.0897626131772995, 0.13107720017433167, 0.17239177227020264, 0.213706374168396, 0.25502097606658936, 0.2963355481624603, 0.3376501202583313, 0.37896472215652466, 0.420279324054718, 0.461593896150589, 0.50290846824646, 0.5442229509353638, 0.5855375528335571, 0.6268521547317505, 0.6681666970252991, 0.7094812989234924, 0.7507959008216858, 0.7921104431152344, 0.8334250450134277, 0.8747396469116211, 0.9160542488098145, 0.9573688507080078, 0.9986833930015564, 1.0399980545043945, 1.0813125371932983, 1.1226271390914917, 1.163941740989685, 1.2052563428878784, 1.2465709447860718, 1.2878855466842651, 1.3292001485824585, 1.3705146312713623, 1.4118292331695557, 1.453143835067749, 1.4944584369659424, 1.5357730388641357, 1.577087640762329, 1.6184022426605225, 1.6597168445587158, 1.7010314464569092, 1.742345929145813, 1.7836605310440063, 1.8249751329421997, 1.866289734840393]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 6.0, 9.0, 11.0, 14.0, 17.0, 14.0, 17.0, 20.0, 27.0, 24.0, 31.0, 25.0, 37.0, 24.0, 32.0, 42.0, 46.0, 38.0, 42.0, 39.0, 37.0, 36.0, 28.0, 38.0, 34.0, 38.0, 30.0, 31.0, 20.0, 31.0, 23.0, 23.0, 19.0, 15.0, 10.0, 7.0, 5.0, 12.0, 4.0, 2.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6271832585334778, -0.6067649126052856, -0.5863465666770935, -0.5659282207489014, -0.545509934425354, -0.5250915884971619, -0.5046732425689697, -0.4842548966407776, -0.46383655071258545, -0.4434182047843933, -0.42299985885620117, -0.4025815427303314, -0.3821631968021393, -0.36174485087394714, -0.3413265347480774, -0.32090818881988525, -0.3004898428916931, -0.280071496963501, -0.25965315103530884, -0.2392348349094391, -0.21881648898124695, -0.1983981430530548, -0.17797981202602386, -0.15756148099899292, -0.13714313507080078, -0.11672479659318924, -0.0963064581155777, -0.07588811963796616, -0.055469781160354614, -0.03505144268274307, -0.01463310420513153, 0.005785226821899414, 0.026203513145446777, 0.04662185162305832, 0.06704019010066986, 0.0874585285782814, 0.10787686705589294, 0.12829521298408508, 0.14871354401111603, 0.16913187503814697, 0.1895502209663391, 0.20996856689453125, 0.2303868979215622, 0.25080522894859314, 0.2712235748767853, 0.2916419208049774, 0.31206023693084717, 0.3324785828590393, 0.35289692878723145, 0.3733152747154236, 0.3937336206436157, 0.4141519367694855, 0.4345702826976776, 0.45498862862586975, 0.4754069447517395, 0.49582529067993164, 0.5162436366081238, 0.5366619825363159, 0.5570803284645081, 0.5774986743927002, 0.5979169607162476, 0.6183353066444397, 0.6387536525726318, 0.659171998500824, 0.6795903444290161]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 19.0, 20.0, 29.0, 41.0, 56.0, 93.0, 139.0, 246.0, 433.0, 785.0, 1491.0, 2827.0, 6349.0, 15883.0, 51751.0, 312419.0, 3559417.0, 181304.0, 37758.0, 12545.0, 5182.0, 2433.0, 1252.0, 693.0, 398.0, 247.0, 143.0, 77.0, 63.0, 44.0, 27.0, 33.0, 15.0, 7.0, 5.0, 7.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.1744384765625, -0.1690521240234375, -0.163665771484375, -0.1582794189453125, -0.15289306640625, -0.1475067138671875, -0.142120361328125, -0.1367340087890625, -0.13134765625, -0.1259613037109375, -0.120574951171875, -0.1151885986328125, -0.10980224609375, -0.1044158935546875, -0.099029541015625, -0.0936431884765625, -0.0882568359375, -0.0828704833984375, -0.077484130859375, -0.0720977783203125, -0.06671142578125, -0.0613250732421875, -0.055938720703125, -0.0505523681640625, -0.045166015625, -0.0397796630859375, -0.034393310546875, -0.0290069580078125, -0.02362060546875, -0.0182342529296875, -0.012847900390625, -0.0074615478515625, -0.0020751953125, 0.0033111572265625, 0.008697509765625, 0.0140838623046875, 0.01947021484375, 0.0248565673828125, 0.030242919921875, 0.0356292724609375, 0.041015625, 0.0464019775390625, 0.051788330078125, 0.0571746826171875, 0.06256103515625, 0.0679473876953125, 0.073333740234375, 0.0787200927734375, 0.0841064453125, 0.0894927978515625, 0.094879150390625, 0.1002655029296875, 0.10565185546875, 0.1110382080078125, 0.116424560546875, 0.1218109130859375, 0.127197265625, 0.1325836181640625, 0.137969970703125, 0.1433563232421875, 0.14874267578125, 0.1541290283203125, 0.159515380859375, 0.1649017333984375, 0.1702880859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 8.0, 14.0, 23.0, 35.0, 46.0, 52.0, 59.0, 86.0, 89.0, 103.0, 83.0, 79.0, 75.0, 79.0, 41.0, 40.0, 26.0, 17.0, 19.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0416259765625, -0.040076255798339844, -0.03852653503417969, -0.03697681427001953, -0.035427093505859375, -0.03387737274169922, -0.03232765197753906, -0.030777931213378906, -0.02922821044921875, -0.027678489685058594, -0.026128768920898438, -0.02457904815673828, -0.023029327392578125, -0.02147960662841797, -0.019929885864257812, -0.018380165100097656, -0.0168304443359375, -0.015280723571777344, -0.013731002807617188, -0.012181282043457031, -0.010631561279296875, -0.009081840515136719, -0.0075321197509765625, -0.005982398986816406, -0.00443267822265625, -0.0028829574584960938, -0.0013332366943359375, 0.00021648406982421875, 0.001766204833984375, 0.0033159255981445312, 0.0048656463623046875, 0.006415367126464844, 0.007965087890625, 0.009514808654785156, 0.011064529418945312, 0.012614250183105469, 0.014163970947265625, 0.01571369171142578, 0.017263412475585938, 0.018813133239746094, 0.02036285400390625, 0.021912574768066406, 0.023462295532226562, 0.02501201629638672, 0.026561737060546875, 0.02811145782470703, 0.029661178588867188, 0.031210899353027344, 0.0327606201171875, 0.034310340881347656, 0.03586006164550781, 0.03740978240966797, 0.038959503173828125, 0.04050922393798828, 0.04205894470214844, 0.043608665466308594, 0.04515838623046875, 0.046708106994628906, 0.04825782775878906, 0.04980754852294922, 0.051357269287109375, 0.05290699005126953, 0.05445671081542969, 0.056006431579589844, 0.05755615234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 22.0, 50.0, 75.0, 124.0, 195.0, 374.0, 726.0, 1705.0, 4503.0, 15803.0, 83074.0, 1302964.0, 2653488.0, 103694.0, 18889.0, 5015.0, 1815.0, 772.0, 401.0, 233.0, 134.0, 64.0, 50.0, 41.0, 20.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.224609375, -0.217376708984375, -0.21014404296875, -0.202911376953125, -0.1956787109375, -0.188446044921875, -0.18121337890625, -0.173980712890625, -0.166748046875, -0.159515380859375, -0.15228271484375, -0.145050048828125, -0.1378173828125, -0.130584716796875, -0.12335205078125, -0.116119384765625, -0.10888671875, -0.101654052734375, -0.09442138671875, -0.087188720703125, -0.0799560546875, -0.072723388671875, -0.06549072265625, -0.058258056640625, -0.051025390625, -0.043792724609375, -0.03656005859375, -0.029327392578125, -0.0220947265625, -0.014862060546875, -0.00762939453125, -0.000396728515625, 0.0068359375, 0.014068603515625, 0.02130126953125, 0.028533935546875, 0.0357666015625, 0.042999267578125, 0.05023193359375, 0.057464599609375, 0.064697265625, 0.071929931640625, 0.07916259765625, 0.086395263671875, 0.0936279296875, 0.100860595703125, 0.10809326171875, 0.115325927734375, 0.12255859375, 0.129791259765625, 0.13702392578125, 0.144256591796875, 0.1514892578125, 0.158721923828125, 0.16595458984375, 0.173187255859375, 0.180419921875, 0.187652587890625, 0.19488525390625, 0.202117919921875, 0.2093505859375, 0.216583251953125, 0.22381591796875, 0.231048583984375, 0.23828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 2.0, 7.0, 6.0, 11.0, 24.0, 19.0, 20.0, 23.0, 67.0, 79.0, 146.0, 285.0, 617.0, 1590.0, 515.0, 243.0, 137.0, 75.0, 64.0, 41.0, 30.0, 15.0, 9.0, 13.0, 8.0, 5.0, 11.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05377197265625, -0.052001953125, -0.05023193359375, -0.0484619140625, -0.04669189453125, -0.044921875, -0.04315185546875, -0.0413818359375, -0.03961181640625, -0.037841796875, -0.03607177734375, -0.0343017578125, -0.03253173828125, -0.03076171875, -0.02899169921875, -0.0272216796875, -0.02545166015625, -0.023681640625, -0.02191162109375, -0.0201416015625, -0.01837158203125, -0.0166015625, -0.01483154296875, -0.0130615234375, -0.01129150390625, -0.009521484375, -0.00775146484375, -0.0059814453125, -0.00421142578125, -0.00244140625, -0.00067138671875, 0.0010986328125, 0.00286865234375, 0.004638671875, 0.00640869140625, 0.0081787109375, 0.00994873046875, 0.01171875, 0.01348876953125, 0.0152587890625, 0.01702880859375, 0.018798828125, 0.02056884765625, 0.0223388671875, 0.02410888671875, 0.02587890625, 0.02764892578125, 0.0294189453125, 0.03118896484375, 0.032958984375, 0.03472900390625, 0.0364990234375, 0.03826904296875, 0.0400390625, 0.04180908203125, 0.0435791015625, 0.04534912109375, 0.047119140625, 0.04888916015625, 0.0506591796875, 0.05242919921875, 0.05419921875, 0.05596923828125, 0.0577392578125, 0.05950927734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 17.0, 65.0, 145.0, 281.0, 233.0, 153.0, 57.0, 33.0, 12.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4061968922615051, -0.38357627391815186, -0.3609556555747986, -0.3383350372314453, -0.31571441888809204, -0.29309380054473877, -0.2704732120037079, -0.24785259366035461, -0.22523197531700134, -0.20261135697364807, -0.1799907386302948, -0.15737013518810272, -0.13474951684474945, -0.11212889850139618, -0.0895082950592041, -0.06688767671585083, -0.04426705837249756, -0.021646443754434586, 0.0009741708636283875, 0.023594781756401062, 0.046215400099754333, 0.0688360184431076, 0.09145662188529968, 0.11407724022865295, 0.13669785857200623, 0.1593184769153595, 0.18193909525871277, 0.20455969870090485, 0.22718031704425812, 0.2498009353876114, 0.27242153882980347, 0.29504215717315674, 0.3176628351211548, 0.34028345346450806, 0.36290407180786133, 0.3855246901512146, 0.40814530849456787, 0.43076592683792114, 0.453386515378952, 0.4760071337223053, 0.49862775206565857, 0.5212483406066895, 0.5438689589500427, 0.566489577293396, 0.5891101956367493, 0.6117308139801025, 0.6343514323234558, 0.6569720506668091, 0.6795926690101624, 0.7022132873535156, 0.7248339056968689, 0.7474545240402222, 0.7700751423835754, 0.7926957607269287, 0.8153163194656372, 0.8379369974136353, 0.8605575561523438, 0.883178174495697, 0.9057987928390503, 0.9284194111824036, 0.9510400295257568, 0.9736606478691101, 0.9962812662124634, 1.0189018249511719, 1.04152250289917]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 2.0, 5.0, 9.0, 15.0, 10.0, 9.0, 13.0, 22.0, 20.0, 18.0, 38.0, 23.0, 22.0, 34.0, 28.0, 28.0, 37.0, 29.0, 38.0, 35.0, 34.0, 45.0, 45.0, 45.0, 37.0, 29.0, 35.0, 29.0, 26.0, 32.0, 26.0, 26.0, 23.0, 22.0, 17.0, 16.0, 16.0, 11.0, 8.0, 13.0, 1.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.16365522146224976, -0.15868541598320007, -0.1537156105041504, -0.14874579012393951, -0.14377598464488983, -0.13880617916584015, -0.13383637368679047, -0.12886656820774078, -0.1238967552781105, -0.11892694979906082, -0.11395713686943054, -0.10898733139038086, -0.10401752591133118, -0.0990477129817009, -0.09407790750265121, -0.08910809457302094, -0.08413828909397125, -0.07916848361492157, -0.07419867068529129, -0.06922886520624161, -0.06425905227661133, -0.059289246797561646, -0.05431944131851196, -0.04934963211417198, -0.044379822909832, -0.03941001370549202, -0.03444020450115204, -0.029470399022102356, -0.024500589817762375, -0.019530780613422394, -0.014560973271727562, -0.00959116593003273, -0.004621356725692749, 0.00034845154732465744, 0.005318259820342064, 0.01028806809335947, 0.015257876366376877, 0.020227685570716858, 0.02519749291241169, 0.03016730025410652, 0.0351371094584465, 0.040106918662786484, 0.045076727867126465, 0.05004653334617615, 0.05501634255051613, 0.05998615175485611, 0.06495595723390579, 0.06992577016353607, 0.07489557564258575, 0.07986538112163544, 0.08483519405126572, 0.0898049995303154, 0.09477481245994568, 0.09974461793899536, 0.10471442341804504, 0.10968422889709473, 0.114654041826725, 0.11962384730577469, 0.12459366023540497, 0.12956346571445465, 0.13453327119350433, 0.1395030915737152, 0.1444728970527649, 0.14944270253181458, 0.15441250801086426]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 8.0, 10.0, 13.0, 24.0, 25.0, 54.0, 72.0, 124.0, 215.0, 352.0, 711.0, 1406.0, 2971.0, 6940.0, 18393.0, 55577.0, 176340.0, 412769.0, 249793.0, 79768.0, 26002.0, 9506.0, 3782.0, 1730.0, 854.0, 422.0, 271.0, 153.0, 115.0, 48.0, 45.0, 21.0, 11.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.1375732421875, -0.1329345703125, -0.1282958984375, -0.1236572265625, -0.1190185546875, -0.1143798828125, -0.1097412109375, -0.1051025390625, -0.1004638671875, -0.0958251953125, -0.0911865234375, -0.0865478515625, -0.0819091796875, -0.0772705078125, -0.0726318359375, -0.0679931640625, -0.0633544921875, -0.0587158203125, -0.0540771484375, -0.0494384765625, -0.0447998046875, -0.0401611328125, -0.0355224609375, -0.0308837890625, -0.0262451171875, -0.0216064453125, -0.0169677734375, -0.0123291015625, -0.0076904296875, -0.0030517578125, 0.0015869140625, 0.0062255859375, 0.0108642578125, 0.0155029296875, 0.0201416015625, 0.0247802734375, 0.0294189453125, 0.0340576171875, 0.0386962890625, 0.0433349609375, 0.0479736328125, 0.0526123046875, 0.0572509765625, 0.0618896484375, 0.0665283203125, 0.0711669921875, 0.0758056640625, 0.0804443359375, 0.0850830078125, 0.0897216796875, 0.0943603515625, 0.0989990234375, 0.1036376953125, 0.1082763671875, 0.1129150390625, 0.1175537109375, 0.1221923828125, 0.1268310546875, 0.1314697265625, 0.1361083984375, 0.1407470703125, 0.1453857421875, 0.1500244140625, 0.1546630859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 11.0, 15.0, 16.0, 40.0, 37.0, 65.0, 67.0, 76.0, 102.0, 91.0, 91.0, 89.0, 56.0, 59.0, 47.0, 42.0, 32.0, 22.0, 15.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04156494140625, -0.040015220642089844, -0.03846549987792969, -0.03691577911376953, -0.035366058349609375, -0.03381633758544922, -0.03226661682128906, -0.030716896057128906, -0.02916717529296875, -0.027617454528808594, -0.026067733764648438, -0.02451801300048828, -0.022968292236328125, -0.02141857147216797, -0.019868850708007812, -0.018319129943847656, -0.0167694091796875, -0.015219688415527344, -0.013669967651367188, -0.012120246887207031, -0.010570526123046875, -0.009020805358886719, -0.0074710845947265625, -0.005921363830566406, -0.00437164306640625, -0.0028219223022460938, -0.0012722015380859375, 0.00027751922607421875, 0.001827239990234375, 0.0033769607543945312, 0.0049266815185546875, 0.006476402282714844, 0.008026123046875, 0.009575843811035156, 0.011125564575195312, 0.012675285339355469, 0.014225006103515625, 0.01577472686767578, 0.017324447631835938, 0.018874168395996094, 0.02042388916015625, 0.021973609924316406, 0.023523330688476562, 0.02507305145263672, 0.026622772216796875, 0.02817249298095703, 0.029722213745117188, 0.031271934509277344, 0.0328216552734375, 0.034371376037597656, 0.03592109680175781, 0.03747081756591797, 0.039020538330078125, 0.04057025909423828, 0.04211997985839844, 0.043669700622558594, 0.04521942138671875, 0.046769142150878906, 0.04831886291503906, 0.04986858367919922, 0.051418304443359375, 0.05296802520751953, 0.05451774597167969, 0.056067466735839844, 0.0576171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 24.0, 29.0, 35.0, 48.0, 81.0, 117.0, 180.0, 261.0, 448.0, 698.0, 1331.0, 3320.0, 11368.0, 59290.0, 315145.0, 501621.0, 122916.0, 22055.0, 5270.0, 1920.0, 947.0, 534.0, 309.0, 180.0, 132.0, 88.0, 52.0, 39.0, 29.0, 17.0, 12.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.1751556396484375, -0.169158935546875, -0.1631622314453125, -0.15716552734375, -0.1511688232421875, -0.145172119140625, -0.1391754150390625, -0.1331787109375, -0.1271820068359375, -0.121185302734375, -0.1151885986328125, -0.10919189453125, -0.1031951904296875, -0.097198486328125, -0.0912017822265625, -0.085205078125, -0.0792083740234375, -0.073211669921875, -0.0672149658203125, -0.06121826171875, -0.0552215576171875, -0.049224853515625, -0.0432281494140625, -0.0372314453125, -0.0312347412109375, -0.025238037109375, -0.0192413330078125, -0.01324462890625, -0.0072479248046875, -0.001251220703125, 0.0047454833984375, 0.0107421875, 0.0167388916015625, 0.022735595703125, 0.0287322998046875, 0.03472900390625, 0.0407257080078125, 0.046722412109375, 0.0527191162109375, 0.0587158203125, 0.0647125244140625, 0.070709228515625, 0.0767059326171875, 0.08270263671875, 0.0886993408203125, 0.094696044921875, 0.1006927490234375, 0.106689453125, 0.1126861572265625, 0.118682861328125, 0.1246795654296875, 0.13067626953125, 0.1366729736328125, 0.142669677734375, 0.1486663818359375, 0.1546630859375, 0.1606597900390625, 0.166656494140625, 0.1726531982421875, 0.17864990234375, 0.1846466064453125, 0.190643310546875, 0.1966400146484375, 0.20263671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 9.0, 12.0, 16.0, 27.0, 26.0, 22.0, 28.0, 16.0, 23.0, 31.0, 36.0, 47.0, 48.0, 49.0, 49.0, 42.0, 43.0, 46.0, 43.0, 39.0, 46.0, 42.0, 22.0, 29.0, 31.0, 34.0, 24.0, 21.0, 21.0, 11.0, 9.0, 6.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.1314382553100586, -0.1273784637451172, -0.12331867218017578, -0.11925888061523438, -0.11519908905029297, -0.11113929748535156, -0.10707950592041016, -0.10301971435546875, -0.09895992279052734, -0.09490013122558594, -0.09084033966064453, -0.08678054809570312, -0.08272075653076172, -0.07866096496582031, -0.0746011734008789, -0.0705413818359375, -0.0664815902709961, -0.06242179870605469, -0.05836200714111328, -0.054302215576171875, -0.05024242401123047, -0.04618263244628906, -0.042122840881347656, -0.03806304931640625, -0.034003257751464844, -0.029943466186523438, -0.02588367462158203, -0.021823883056640625, -0.01776409149169922, -0.013704299926757812, -0.009644508361816406, -0.005584716796875, -0.0015249252319335938, 0.0025348663330078125, 0.006594657897949219, 0.010654449462890625, 0.014714241027832031, 0.018774032592773438, 0.022833824157714844, 0.02689361572265625, 0.030953407287597656, 0.03501319885253906, 0.03907299041748047, 0.043132781982421875, 0.04719257354736328, 0.05125236511230469, 0.055312156677246094, 0.0593719482421875, 0.0634317398071289, 0.06749153137207031, 0.07155132293701172, 0.07561111450195312, 0.07967090606689453, 0.08373069763183594, 0.08779048919677734, 0.09185028076171875, 0.09591007232666016, 0.09996986389160156, 0.10402965545654297, 0.10808944702148438, 0.11214923858642578, 0.11620903015136719, 0.1202688217163086, 0.12432861328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 16.0, 22.0, 41.0, 103.0, 262.0, 687.0, 2217.0, 8971.0, 48120.0, 452600.0, 472541.0, 50159.0, 9263.0, 2299.0, 759.0, 259.0, 98.0, 56.0, 31.0, 18.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103759765625, -0.09961128234863281, -0.09546279907226562, -0.09131431579589844, -0.08716583251953125, -0.08301734924316406, -0.07886886596679688, -0.07472038269042969, -0.0705718994140625, -0.06642341613769531, -0.062274932861328125, -0.05812644958496094, -0.05397796630859375, -0.04982948303222656, -0.045680999755859375, -0.04153251647949219, -0.037384033203125, -0.03323554992675781, -0.029087066650390625, -0.024938583374023438, -0.02079010009765625, -0.016641616821289062, -0.012493133544921875, -0.008344650268554688, -0.0041961669921875, -4.76837158203125e-05, 0.004100799560546875, 0.008249282836914062, 0.01239776611328125, 0.016546249389648438, 0.020694732666015625, 0.024843215942382812, 0.02899169921875, 0.03314018249511719, 0.037288665771484375, 0.04143714904785156, 0.04558563232421875, 0.04973411560058594, 0.053882598876953125, 0.05803108215332031, 0.0621795654296875, 0.06632804870605469, 0.07047653198242188, 0.07462501525878906, 0.07877349853515625, 0.08292198181152344, 0.08707046508789062, 0.09121894836425781, 0.095367431640625, 0.09951591491699219, 0.10366439819335938, 0.10781288146972656, 0.11196136474609375, 0.11610984802246094, 0.12025833129882812, 0.12440681457519531, 0.1285552978515625, 0.1327037811279297, 0.13685226440429688, 0.14100074768066406, 0.14514923095703125, 0.14929771423339844, 0.15344619750976562, 0.1575946807861328, 0.1617431640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 13.0, 7.0, 7.0, 12.0, 17.0, 25.0, 17.0, 25.0, 35.0, 53.0, 63.0, 58.0, 66.0, 77.0, 78.0, 73.0, 57.0, 48.0, 60.0, 38.0, 40.0, 19.0, 23.0, 20.0, 14.0, 6.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.529424667358398e-05, -8.270237594842911e-05, -8.011050522327423e-05, -7.751863449811935e-05, -7.492676377296448e-05, -7.23348930478096e-05, -6.974302232265472e-05, -6.715115159749985e-05, -6.455928087234497e-05, -6.19674101471901e-05, -5.937553942203522e-05, -5.678366869688034e-05, -5.4191797971725464e-05, -5.159992724657059e-05, -4.900805652141571e-05, -4.6416185796260834e-05, -4.382431507110596e-05, -4.123244434595108e-05, -3.8640573620796204e-05, -3.604870289564133e-05, -3.345683217048645e-05, -3.0864961445331573e-05, -2.8273090720176697e-05, -2.568121999502182e-05, -2.3089349269866943e-05, -2.0497478544712067e-05, -1.790560781955719e-05, -1.5313737094402313e-05, -1.2721866369247437e-05, -1.012999564409256e-05, -7.538124918937683e-06, -4.946254193782806e-06, -2.3543834686279297e-06, 2.3748725652694702e-07, 2.8293579816818237e-06, 5.4212287068367004e-06, 8.013099431991577e-06, 1.0604970157146454e-05, 1.319684088230133e-05, 1.5788711607456207e-05, 1.8380582332611084e-05, 2.097245305776596e-05, 2.3564323782920837e-05, 2.6156194508075714e-05, 2.874806523323059e-05, 3.133993595838547e-05, 3.3931806683540344e-05, 3.652367740869522e-05, 3.91155481338501e-05, 4.1707418859004974e-05, 4.429928958415985e-05, 4.689116030931473e-05, 4.9483031034469604e-05, 5.207490175962448e-05, 5.466677248477936e-05, 5.7258643209934235e-05, 5.985051393508911e-05, 6.244238466024399e-05, 6.503425538539886e-05, 6.762612611055374e-05, 7.021799683570862e-05, 7.28098675608635e-05, 7.540173828601837e-05, 7.799360901117325e-05, 8.058547973632812e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 9.0, 24.0, 33.0, 37.0, 47.0, 93.0, 132.0, 245.0, 461.0, 1056.0, 2847.0, 8872.0, 40139.0, 320006.0, 578183.0, 75284.0, 14221.0, 3979.0, 1498.0, 620.0, 325.0, 167.0, 85.0, 64.0, 44.0, 21.0, 20.0, 12.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10326766967773438, -0.09960174560546875, -0.09593582153320312, -0.0922698974609375, -0.08860397338867188, -0.08493804931640625, -0.08127212524414062, -0.077606201171875, -0.07394027709960938, -0.07027435302734375, -0.06660842895507812, -0.0629425048828125, -0.059276580810546875, -0.05561065673828125, -0.051944732666015625, -0.04827880859375, -0.044612884521484375, -0.04094696044921875, -0.037281036376953125, -0.0336151123046875, -0.029949188232421875, -0.02628326416015625, -0.022617340087890625, -0.018951416015625, -0.015285491943359375, -0.01161956787109375, -0.007953643798828125, -0.0042877197265625, -0.000621795654296875, 0.00304412841796875, 0.006710052490234375, 0.0103759765625, 0.014041900634765625, 0.01770782470703125, 0.021373748779296875, 0.0250396728515625, 0.028705596923828125, 0.03237152099609375, 0.036037445068359375, 0.039703369140625, 0.043369293212890625, 0.04703521728515625, 0.050701141357421875, 0.0543670654296875, 0.058032989501953125, 0.06169891357421875, 0.06536483764648438, 0.06903076171875, 0.07269668579101562, 0.07636260986328125, 0.08002853393554688, 0.0836944580078125, 0.08736038208007812, 0.09102630615234375, 0.09469223022460938, 0.098358154296875, 0.10202407836914062, 0.10569000244140625, 0.10935592651367188, 0.1130218505859375, 0.11668777465820312, 0.12035369873046875, 0.12401962280273438, 0.127685546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 12.0, 14.0, 25.0, 37.0, 55.0, 69.0, 84.0, 110.0, 104.0, 124.0, 87.0, 64.0, 64.0, 39.0, 23.0, 11.0, 12.0, 13.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06494140625, -0.062483787536621094, -0.06002616882324219, -0.05756855010986328, -0.055110931396484375, -0.05265331268310547, -0.05019569396972656, -0.047738075256347656, -0.04528045654296875, -0.042822837829589844, -0.04036521911621094, -0.03790760040283203, -0.035449981689453125, -0.03299236297607422, -0.030534744262695312, -0.028077125549316406, -0.0256195068359375, -0.023161888122558594, -0.020704269409179688, -0.01824665069580078, -0.015789031982421875, -0.013331413269042969, -0.010873794555664062, -0.008416175842285156, -0.00595855712890625, -0.0035009384155273438, -0.0010433197021484375, 0.0014142990112304688, 0.003871917724609375, 0.006329536437988281, 0.008787155151367188, 0.011244773864746094, 0.013702392578125, 0.016160011291503906, 0.018617630004882812, 0.02107524871826172, 0.023532867431640625, 0.02599048614501953, 0.028448104858398438, 0.030905723571777344, 0.03336334228515625, 0.035820960998535156, 0.03827857971191406, 0.04073619842529297, 0.043193817138671875, 0.04565143585205078, 0.04810905456542969, 0.050566673278808594, 0.0530242919921875, 0.055481910705566406, 0.05793952941894531, 0.06039714813232422, 0.06285476684570312, 0.06531238555908203, 0.06777000427246094, 0.07022762298583984, 0.07268524169921875, 0.07514286041259766, 0.07760047912597656, 0.08005809783935547, 0.08251571655273438, 0.08497333526611328, 0.08743095397949219, 0.0898885726928711, 0.09234619140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 47.0, 148.0, 230.0, 271.0, 170.0, 85.0, 24.0, 10.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0983920097351074, -1.0309560298919678, -0.9635199308395386, -0.8960839509963989, -0.8286479115486145, -0.7612118721008301, -0.6937758922576904, -0.626339852809906, -0.5589038133621216, -0.49146777391433716, -0.4240317642688751, -0.3565957546234131, -0.28915971517562866, -0.22172367572784424, -0.1542876660823822, -0.08685165643692017, -0.019415616989135742, 0.04802040755748749, 0.11545643210411072, 0.18289245665073395, 0.2503284811973572, 0.3177645206451416, 0.38520053029060364, 0.4526365399360657, 0.5200725793838501, 0.5875086188316345, 0.654944658279419, 0.7223806381225586, 0.789816677570343, 0.8572527170181274, 0.9246886968612671, 0.9921247363090515, 1.059560775756836, 1.1269967555999756, 1.1944328546524048, 1.2618688344955444, 1.3293049335479736, 1.3967409133911133, 1.464176893234253, 1.5316128730773926, 1.5990489721298218, 1.6664849519729614, 1.7339210510253906, 1.8013570308685303, 1.86879301071167, 1.9362291097640991, 2.0036652088165283, 2.071101188659668, 2.1385371685028076, 2.2059731483459473, 2.273409128189087, 2.3408453464508057, 2.4082813262939453, 2.475717306137085, 2.5431532859802246, 2.6105892658233643, 2.678025245666504, 2.7454612255096436, 2.812897205352783, 2.880333423614502, 2.9477694034576416, 3.0152053833007812, 3.082641363143921, 3.1500773429870605, 3.2175135612487793]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 8.0, 14.0, 13.0, 18.0, 24.0, 30.0, 22.0, 38.0, 39.0, 60.0, 49.0, 52.0, 63.0, 58.0, 59.0, 70.0, 63.0, 50.0, 39.0, 49.0, 34.0, 38.0, 18.0, 21.0, 17.0, 13.0, 12.0, 4.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0601372718811035, -1.0322436094284058, -1.004349946975708, -0.9764561653137207, -0.948562502861023, -0.9206688404083252, -0.8927751183509827, -0.8648813962936401, -0.8369877338409424, -0.8090940713882446, -0.7812003493309021, -0.7533066272735596, -0.7254129648208618, -0.6975193023681641, -0.6696255803108215, -0.641731858253479, -0.6138381958007812, -0.5859445333480835, -0.558050811290741, -0.5301570892333984, -0.5022634267807007, -0.47436973452568054, -0.4464760422706604, -0.41858235001564026, -0.3906886577606201, -0.3627949655056, -0.33490127325057983, -0.3070075809955597, -0.27911388874053955, -0.2512201964855194, -0.22332650423049927, -0.19543281197547913, -0.1675390601158142, -0.13964536786079407, -0.11175167560577393, -0.08385798335075378, -0.05596429109573364, -0.0280705988407135, -0.00017690658569335938, 0.027716785669326782, 0.055610477924346924, 0.08350417017936707, 0.11139786243438721, 0.13929155468940735, 0.1671852469444275, 0.19507893919944763, 0.22297263145446777, 0.2508663237094879, 0.27876001596450806, 0.3066537082195282, 0.33454740047454834, 0.3624410927295685, 0.3903347849845886, 0.41822847723960876, 0.4461221694946289, 0.47401586174964905, 0.5019095540046692, 0.5298032760620117, 0.5576969385147095, 0.5855906009674072, 0.6134843230247498, 0.6413780450820923, 0.66927170753479, 0.6971653699874878, 0.7250590920448303]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 8.0, 11.0, 18.0, 15.0, 32.0, 67.0, 87.0, 190.0, 292.0, 513.0, 1064.0, 2070.0, 4820.0, 12212.0, 36979.0, 162584.0, 3032135.0, 808167.0, 92017.0, 24793.0, 8718.0, 3775.0, 1637.0, 901.0, 457.0, 255.0, 171.0, 106.0, 67.0, 34.0, 26.0, 22.0, 15.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15914535522460938, -0.15398406982421875, -0.14882278442382812, -0.1436614990234375, -0.13850021362304688, -0.13333892822265625, -0.12817764282226562, -0.123016357421875, -0.11785507202148438, -0.11269378662109375, -0.10753250122070312, -0.1023712158203125, -0.09720993041992188, -0.09204864501953125, -0.08688735961914062, -0.08172607421875, -0.07656478881835938, -0.07140350341796875, -0.06624221801757812, -0.0610809326171875, -0.055919647216796875, -0.05075836181640625, -0.045597076416015625, -0.040435791015625, -0.035274505615234375, -0.03011322021484375, -0.024951934814453125, -0.0197906494140625, -0.014629364013671875, -0.00946807861328125, -0.004306793212890625, 0.0008544921875, 0.006015777587890625, 0.01117706298828125, 0.016338348388671875, 0.0214996337890625, 0.026660919189453125, 0.03182220458984375, 0.036983489990234375, 0.042144775390625, 0.047306060791015625, 0.05246734619140625, 0.057628631591796875, 0.0627899169921875, 0.06795120239257812, 0.07311248779296875, 0.07827377319335938, 0.08343505859375, 0.08859634399414062, 0.09375762939453125, 0.09891891479492188, 0.1040802001953125, 0.10924148559570312, 0.11440277099609375, 0.11956405639648438, 0.124725341796875, 0.12988662719726562, 0.13504791259765625, 0.14020919799804688, 0.1453704833984375, 0.15053176879882812, 0.15569305419921875, 0.16085433959960938, 0.166015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 9.0, 14.0, 22.0, 28.0, 40.0, 52.0, 73.0, 87.0, 106.0, 85.0, 93.0, 68.0, 77.0, 66.0, 43.0, 33.0, 31.0, 15.0, 20.0, 11.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0452880859375, -0.043773651123046875, -0.04225921630859375, -0.040744781494140625, -0.0392303466796875, -0.037715911865234375, -0.03620147705078125, -0.034687042236328125, -0.033172607421875, -0.031658172607421875, -0.03014373779296875, -0.028629302978515625, -0.0271148681640625, -0.025600433349609375, -0.02408599853515625, -0.022571563720703125, -0.02105712890625, -0.019542694091796875, -0.01802825927734375, -0.016513824462890625, -0.0149993896484375, -0.013484954833984375, -0.01197052001953125, -0.010456085205078125, -0.008941650390625, -0.007427215576171875, -0.00591278076171875, -0.004398345947265625, -0.0028839111328125, -0.001369476318359375, 0.00014495849609375, 0.001659393310546875, 0.003173828125, 0.004688262939453125, 0.00620269775390625, 0.007717132568359375, 0.0092315673828125, 0.010746002197265625, 0.01226043701171875, 0.013774871826171875, 0.015289306640625, 0.016803741455078125, 0.01831817626953125, 0.019832611083984375, 0.0213470458984375, 0.022861480712890625, 0.02437591552734375, 0.025890350341796875, 0.02740478515625, 0.028919219970703125, 0.03043365478515625, 0.031948089599609375, 0.0334625244140625, 0.034976959228515625, 0.03649139404296875, 0.038005828857421875, 0.039520263671875, 0.041034698486328125, 0.04254913330078125, 0.044063568115234375, 0.0455780029296875, 0.047092437744140625, 0.04860687255859375, 0.050121307373046875, 0.0516357421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 9.0, 5.0, 13.0, 14.0, 9.0, 33.0, 33.0, 59.0, 95.0, 137.0, 241.0, 435.0, 818.0, 1636.0, 3674.0, 8841.0, 24660.0, 79790.0, 355200.0, 2772875.0, 751955.0, 132669.0, 38043.0, 13334.0, 5114.0, 2193.0, 1023.0, 598.0, 261.0, 195.0, 100.0, 67.0, 43.0, 32.0, 17.0, 14.0, 9.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13479232788085938, -0.13066864013671875, -0.12654495239257812, -0.1224212646484375, -0.11829757690429688, -0.11417388916015625, -0.11005020141601562, -0.105926513671875, -0.10180282592773438, -0.09767913818359375, -0.09355545043945312, -0.0894317626953125, -0.08530807495117188, -0.08118438720703125, -0.07706069946289062, -0.07293701171875, -0.06881332397460938, -0.06468963623046875, -0.060565948486328125, -0.0564422607421875, -0.052318572998046875, -0.04819488525390625, -0.044071197509765625, -0.039947509765625, -0.035823822021484375, -0.03170013427734375, -0.027576446533203125, -0.0234527587890625, -0.019329071044921875, -0.01520538330078125, -0.011081695556640625, -0.0069580078125, -0.002834320068359375, 0.00128936767578125, 0.005413055419921875, 0.0095367431640625, 0.013660430908203125, 0.01778411865234375, 0.021907806396484375, 0.026031494140625, 0.030155181884765625, 0.03427886962890625, 0.038402557373046875, 0.0425262451171875, 0.046649932861328125, 0.05077362060546875, 0.054897308349609375, 0.05902099609375, 0.06314468383789062, 0.06726837158203125, 0.07139205932617188, 0.0755157470703125, 0.07963943481445312, 0.08376312255859375, 0.08788681030273438, 0.092010498046875, 0.09613418579101562, 0.10025787353515625, 0.10438156127929688, 0.1085052490234375, 0.11262893676757812, 0.11675262451171875, 0.12087631225585938, 0.125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 0.0, 8.0, 8.0, 9.0, 15.0, 19.0, 24.0, 32.0, 37.0, 55.0, 88.0, 117.0, 181.0, 273.0, 515.0, 922.0, 693.0, 346.0, 221.0, 139.0, 79.0, 71.0, 47.0, 37.0, 30.0, 25.0, 16.0, 22.0, 5.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047088623046875, -0.04532766342163086, -0.04356670379638672, -0.04180574417114258, -0.04004478454589844, -0.0382838249206543, -0.036522865295410156, -0.034761905670166016, -0.033000946044921875, -0.031239986419677734, -0.029479026794433594, -0.027718067169189453, -0.025957107543945312, -0.024196147918701172, -0.02243518829345703, -0.02067422866821289, -0.01891326904296875, -0.01715230941772461, -0.015391349792480469, -0.013630390167236328, -0.011869430541992188, -0.010108470916748047, -0.008347511291503906, -0.006586551666259766, -0.004825592041015625, -0.0030646324157714844, -0.0013036727905273438, 0.0004572868347167969, 0.0022182464599609375, 0.003979206085205078, 0.005740165710449219, 0.007501125335693359, 0.0092620849609375, 0.01102304458618164, 0.012784004211425781, 0.014544963836669922, 0.016305923461914062, 0.018066883087158203, 0.019827842712402344, 0.021588802337646484, 0.023349761962890625, 0.025110721588134766, 0.026871681213378906, 0.028632640838623047, 0.030393600463867188, 0.03215456008911133, 0.03391551971435547, 0.03567647933959961, 0.03743743896484375, 0.03919839859008789, 0.04095935821533203, 0.04272031784057617, 0.04448127746582031, 0.04624223709106445, 0.048003196716308594, 0.049764156341552734, 0.051525115966796875, 0.053286075592041016, 0.055047035217285156, 0.0568079948425293, 0.05856895446777344, 0.06032991409301758, 0.06209087371826172, 0.06385183334350586, 0.06561279296875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 10.0, 25.0, 32.0, 72.0, 141.0, 190.0, 194.0, 157.0, 94.0, 39.0, 25.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5548077821731567, -0.5319732427597046, -0.5091387629508972, -0.48630422353744507, -0.4634696841239929, -0.44063517451286316, -0.4178006649017334, -0.39496612548828125, -0.3721315860748291, -0.34929707646369934, -0.3264625370502472, -0.30362802743911743, -0.2807934880256653, -0.2579589784145355, -0.23512445390224457, -0.2122899293899536, -0.18945541977882385, -0.1666208952665329, -0.14378637075424194, -0.12095185369253159, -0.09811732918024063, -0.07528280466794968, -0.05244828760623932, -0.029613763093948364, -0.00677923858165741, 0.016055284067988396, 0.0388898067176342, 0.06172432750463486, 0.08455885201692581, 0.10739337652921677, 0.13022789359092712, 0.15306241810321808, 0.17589694261550903, 0.1987314671278, 0.22156599164009094, 0.2444005012512207, 0.26723504066467285, 0.2900695502758026, 0.3129040598869324, 0.3357385993003845, 0.35857313871383667, 0.38140764832496643, 0.4042421877384186, 0.42707669734954834, 0.4499112367630005, 0.47274574637413025, 0.49558025598526, 0.5184147953987122, 0.5412492752075195, 0.5640838146209717, 0.586918294429779, 0.6097528338432312, 0.6325873732566833, 0.6554219126701355, 0.6782563924789429, 0.701090931892395, 0.7239254713058472, 0.7467600107192993, 0.7695944905281067, 0.7924290299415588, 0.815263569355011, 0.8380981087684631, 0.8609325885772705, 0.8837671279907227, 0.9066016674041748]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 10.0, 8.0, 11.0, 12.0, 17.0, 16.0, 29.0, 33.0, 19.0, 24.0, 27.0, 28.0, 32.0, 30.0, 41.0, 31.0, 42.0, 39.0, 44.0, 35.0, 36.0, 37.0, 44.0, 45.0, 37.0, 32.0, 34.0, 30.0, 23.0, 21.0, 24.0, 15.0, 13.0, 18.0, 8.0, 9.0, 8.0, 5.0, 6.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-0.23109257221221924, -0.22414252161979675, -0.21719247102737427, -0.21024242043495178, -0.2032923549413681, -0.19634230434894562, -0.18939225375652313, -0.18244220316410065, -0.17549213767051697, -0.16854208707809448, -0.161592036485672, -0.1546419858932495, -0.14769192039966583, -0.14074186980724335, -0.13379181921482086, -0.12684176862239838, -0.11989171802997589, -0.1129416674375534, -0.10599160939455032, -0.09904155880212784, -0.09209150075912476, -0.08514145016670227, -0.07819139957427979, -0.0712413489818573, -0.06429129093885422, -0.057341236621141434, -0.05039118230342865, -0.043441131711006165, -0.03649107739329338, -0.029541023075580597, -0.02259097248315811, -0.015640918165445328, -0.008690863847732544, -0.0017408104613423347, 0.0052092429250478745, 0.012159295380115509, 0.019109349697828293, 0.026059404015541077, 0.03300945460796356, 0.039959508925676346, 0.04690956324338913, 0.05385961756110191, 0.0608096718788147, 0.06775972247123718, 0.07470977306365967, 0.08165983110666275, 0.08860988169908524, 0.09555993974208832, 0.1025099903345108, 0.10946004092693329, 0.11641009896993637, 0.12336014956235886, 0.13031020760536194, 0.13726025819778442, 0.1442103087902069, 0.1511603593826294, 0.15811040997505188, 0.16506046056747437, 0.17201051115989685, 0.17896056175231934, 0.18591062724590302, 0.1928606778383255, 0.19981072843074799, 0.20676077902317047, 0.21371084451675415]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 15.0, 14.0, 33.0, 44.0, 74.0, 125.0, 164.0, 369.0, 666.0, 1460.0, 3597.0, 9832.0, 31016.0, 107243.0, 443507.0, 331702.0, 81494.0, 24110.0, 7751.0, 2820.0, 1170.0, 598.0, 279.0, 183.0, 107.0, 68.0, 42.0, 28.0, 14.0, 14.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1884765625, -0.18217086791992188, -0.17586517333984375, -0.16955947875976562, -0.1632537841796875, -0.15694808959960938, -0.15064239501953125, -0.14433670043945312, -0.138031005859375, -0.13172531127929688, -0.12541961669921875, -0.11911392211914062, -0.1128082275390625, -0.10650253295898438, -0.10019683837890625, -0.09389114379882812, -0.08758544921875, -0.08127975463867188, -0.07497406005859375, -0.06866836547851562, -0.0623626708984375, -0.056056976318359375, -0.04975128173828125, -0.043445587158203125, -0.037139892578125, -0.030834197998046875, -0.02452850341796875, -0.018222808837890625, -0.0119171142578125, -0.005611419677734375, 0.00069427490234375, 0.006999969482421875, 0.0133056640625, 0.019611358642578125, 0.02591705322265625, 0.032222747802734375, 0.0385284423828125, 0.044834136962890625, 0.05113983154296875, 0.057445526123046875, 0.063751220703125, 0.07005691528320312, 0.07636260986328125, 0.08266830444335938, 0.0889739990234375, 0.09527969360351562, 0.10158538818359375, 0.10789108276367188, 0.11419677734375, 0.12050247192382812, 0.12680816650390625, 0.13311386108398438, 0.1394195556640625, 0.14572525024414062, 0.15203094482421875, 0.15833663940429688, 0.164642333984375, 0.17094802856445312, 0.17725372314453125, 0.18355941772460938, 0.1898651123046875, 0.19617080688476562, 0.20247650146484375, 0.20878219604492188, 0.215087890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 4.0, 18.0, 17.0, 31.0, 32.0, 49.0, 61.0, 89.0, 109.0, 102.0, 78.0, 87.0, 93.0, 52.0, 51.0, 36.0, 32.0, 17.0, 17.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.04526042938232422, -0.04364585876464844, -0.042031288146972656, -0.040416717529296875, -0.038802146911621094, -0.03718757629394531, -0.03557300567626953, -0.03395843505859375, -0.03234386444091797, -0.030729293823242188, -0.029114723205566406, -0.027500152587890625, -0.025885581970214844, -0.024271011352539062, -0.02265644073486328, -0.0210418701171875, -0.01942729949951172, -0.017812728881835938, -0.016198158264160156, -0.014583587646484375, -0.012969017028808594, -0.011354446411132812, -0.009739875793457031, -0.00812530517578125, -0.006510734558105469, -0.0048961639404296875, -0.0032815933227539062, -0.001667022705078125, -5.245208740234375e-05, 0.0015621185302734375, 0.0031766891479492188, 0.004791259765625, 0.006405830383300781, 0.008020401000976562, 0.009634971618652344, 0.011249542236328125, 0.012864112854003906, 0.014478683471679688, 0.01609325408935547, 0.01770782470703125, 0.01932239532470703, 0.020936965942382812, 0.022551536560058594, 0.024166107177734375, 0.025780677795410156, 0.027395248413085938, 0.02900981903076172, 0.0306243896484375, 0.03223896026611328, 0.03385353088378906, 0.035468101501464844, 0.037082672119140625, 0.038697242736816406, 0.04031181335449219, 0.04192638397216797, 0.04354095458984375, 0.04515552520751953, 0.04677009582519531, 0.048384666442871094, 0.049999237060546875, 0.051613807678222656, 0.05322837829589844, 0.05484294891357422, 0.05645751953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 11.0, 9.0, 24.0, 23.0, 38.0, 55.0, 86.0, 125.0, 193.0, 340.0, 638.0, 1272.0, 2972.0, 8603.0, 30731.0, 127662.0, 511101.0, 276997.0, 62555.0, 16154.0, 5006.0, 1892.0, 857.0, 464.0, 300.0, 166.0, 86.0, 76.0, 33.0, 31.0, 20.0, 13.0, 9.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1824951171875, -0.1769237518310547, -0.17135238647460938, -0.16578102111816406, -0.16020965576171875, -0.15463829040527344, -0.14906692504882812, -0.1434955596923828, -0.1379241943359375, -0.1323528289794922, -0.12678146362304688, -0.12121009826660156, -0.11563873291015625, -0.11006736755371094, -0.10449600219726562, -0.09892463684082031, -0.093353271484375, -0.08778190612792969, -0.08221054077148438, -0.07663917541503906, -0.07106781005859375, -0.06549644470214844, -0.059925079345703125, -0.05435371398925781, -0.0487823486328125, -0.04321098327636719, -0.037639617919921875, -0.03206825256347656, -0.02649688720703125, -0.020925521850585938, -0.015354156494140625, -0.009782791137695312, -0.00421142578125, 0.0013599395751953125, 0.006931304931640625, 0.012502670288085938, 0.01807403564453125, 0.023645401000976562, 0.029216766357421875, 0.03478813171386719, 0.0403594970703125, 0.04593086242675781, 0.051502227783203125, 0.05707359313964844, 0.06264495849609375, 0.06821632385253906, 0.07378768920898438, 0.07935905456542969, 0.084930419921875, 0.09050178527832031, 0.09607315063476562, 0.10164451599121094, 0.10721588134765625, 0.11278724670410156, 0.11835861206054688, 0.12392997741699219, 0.1295013427734375, 0.1350727081298828, 0.14064407348632812, 0.14621543884277344, 0.15178680419921875, 0.15735816955566406, 0.16292953491210938, 0.1685009002685547, 0.174072265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 7.0, 14.0, 12.0, 16.0, 17.0, 13.0, 24.0, 23.0, 25.0, 32.0, 36.0, 45.0, 42.0, 36.0, 41.0, 35.0, 54.0, 51.0, 51.0, 35.0, 48.0, 52.0, 36.0, 29.0, 30.0, 23.0, 26.0, 23.0, 14.0, 19.0, 13.0, 14.0, 18.0, 9.0, 8.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.131103515625, -0.1270771026611328, -0.12305068969726562, -0.11902427673339844, -0.11499786376953125, -0.11097145080566406, -0.10694503784179688, -0.10291862487792969, -0.0988922119140625, -0.09486579895019531, -0.09083938598632812, -0.08681297302246094, -0.08278656005859375, -0.07876014709472656, -0.07473373413085938, -0.07070732116699219, -0.066680908203125, -0.06265449523925781, -0.058628082275390625, -0.05460166931152344, -0.05057525634765625, -0.04654884338378906, -0.042522430419921875, -0.03849601745605469, -0.0344696044921875, -0.030443191528320312, -0.026416778564453125, -0.022390365600585938, -0.01836395263671875, -0.014337539672851562, -0.010311126708984375, -0.0062847137451171875, -0.00225830078125, 0.0017681121826171875, 0.005794525146484375, 0.009820938110351562, 0.01384735107421875, 0.017873764038085938, 0.021900177001953125, 0.025926589965820312, 0.0299530029296875, 0.03397941589355469, 0.038005828857421875, 0.04203224182128906, 0.04605865478515625, 0.05008506774902344, 0.054111480712890625, 0.05813789367675781, 0.062164306640625, 0.06619071960449219, 0.07021713256835938, 0.07424354553222656, 0.07826995849609375, 0.08229637145996094, 0.08632278442382812, 0.09034919738769531, 0.0943756103515625, 0.09840202331542969, 0.10242843627929688, 0.10645484924316406, 0.11048126220703125, 0.11450767517089844, 0.11853408813476562, 0.12256050109863281, 0.1265869140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 12.0, 2.0, 9.0, 14.0, 22.0, 21.0, 52.0, 79.0, 118.0, 208.0, 359.0, 612.0, 1288.0, 3015.0, 7819.0, 23608.0, 94066.0, 489736.0, 335278.0, 63990.0, 17509.0, 6039.0, 2381.0, 1021.0, 583.0, 298.0, 147.0, 95.0, 61.0, 42.0, 17.0, 17.0, 12.0, 10.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10835552215576172, -0.10495567321777344, -0.10155582427978516, -0.09815597534179688, -0.0947561264038086, -0.09135627746582031, -0.08795642852783203, -0.08455657958984375, -0.08115673065185547, -0.07775688171386719, -0.0743570327758789, -0.07095718383789062, -0.06755733489990234, -0.06415748596191406, -0.06075763702392578, -0.0573577880859375, -0.05395793914794922, -0.05055809020996094, -0.047158241271972656, -0.043758392333984375, -0.040358543395996094, -0.03695869445800781, -0.03355884552001953, -0.03015899658203125, -0.02675914764404297, -0.023359298706054688, -0.019959449768066406, -0.016559600830078125, -0.013159751892089844, -0.009759902954101562, -0.006360054016113281, -0.002960205078125, 0.00043964385986328125, 0.0038394927978515625, 0.007239341735839844, 0.010639190673828125, 0.014039039611816406, 0.017438888549804688, 0.02083873748779297, 0.02423858642578125, 0.02763843536376953, 0.031038284301757812, 0.034438133239746094, 0.037837982177734375, 0.041237831115722656, 0.04463768005371094, 0.04803752899169922, 0.0514373779296875, 0.05483722686767578, 0.05823707580566406, 0.061636924743652344, 0.06503677368164062, 0.0684366226196289, 0.07183647155761719, 0.07523632049560547, 0.07863616943359375, 0.08203601837158203, 0.08543586730957031, 0.0888357162475586, 0.09223556518554688, 0.09563541412353516, 0.09903526306152344, 0.10243511199951172, 0.1058349609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 10.0, 16.0, 22.0, 21.0, 29.0, 35.0, 43.0, 39.0, 57.0, 55.0, 79.0, 96.0, 86.0, 72.0, 59.0, 50.0, 45.0, 30.0, 34.0, 23.0, 16.0, 20.0, 13.0, 6.0, 9.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.906835526227951e-05, -7.62399286031723e-05, -7.34115019440651e-05, -7.058307528495789e-05, -6.775464862585068e-05, -6.492622196674347e-05, -6.209779530763626e-05, -5.926936864852905e-05, -5.6440941989421844e-05, -5.3612515330314636e-05, -5.078408867120743e-05, -4.795566201210022e-05, -4.512723535299301e-05, -4.22988086938858e-05, -3.9470382034778595e-05, -3.664195537567139e-05, -3.381352871656418e-05, -3.098510205745697e-05, -2.8156675398349762e-05, -2.5328248739242554e-05, -2.2499822080135345e-05, -1.9671395421028137e-05, -1.684296876192093e-05, -1.401454210281372e-05, -1.1186115443706512e-05, -8.357688784599304e-06, -5.529262125492096e-06, -2.7008354663848877e-06, 1.2759119272232056e-07, 2.956017851829529e-06, 5.784444510936737e-06, 8.612871170043945e-06, 1.1441297829151154e-05, 1.4269724488258362e-05, 1.709815114736557e-05, 1.992657780647278e-05, 2.2755004465579987e-05, 2.5583431124687195e-05, 2.8411857783794403e-05, 3.124028444290161e-05, 3.406871110200882e-05, 3.689713776111603e-05, 3.9725564420223236e-05, 4.2553991079330444e-05, 4.538241773843765e-05, 4.821084439754486e-05, 5.103927105665207e-05, 5.386769771575928e-05, 5.6696124374866486e-05, 5.9524551033973694e-05, 6.23529776930809e-05, 6.518140435218811e-05, 6.800983101129532e-05, 7.083825767040253e-05, 7.366668432950974e-05, 7.649511098861694e-05, 7.932353764772415e-05, 8.215196430683136e-05, 8.498039096593857e-05, 8.780881762504578e-05, 9.063724428415298e-05, 9.346567094326019e-05, 9.62940976023674e-05, 9.912252426147461e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 8.0, 3.0, 14.0, 23.0, 23.0, 32.0, 53.0, 69.0, 121.0, 174.0, 282.0, 492.0, 934.0, 2063.0, 4792.0, 12981.0, 43507.0, 193557.0, 573737.0, 159208.0, 36922.0, 11416.0, 4227.0, 1771.0, 894.0, 476.0, 271.0, 163.0, 109.0, 57.0, 50.0, 34.0, 21.0, 15.0, 12.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07875251770019531, -0.07565689086914062, -0.07256126403808594, -0.06946563720703125, -0.06637001037597656, -0.06327438354492188, -0.06017875671386719, -0.0570831298828125, -0.05398750305175781, -0.050891876220703125, -0.04779624938964844, -0.04470062255859375, -0.04160499572753906, -0.038509368896484375, -0.03541374206542969, -0.032318115234375, -0.029222488403320312, -0.026126861572265625, -0.023031234741210938, -0.01993560791015625, -0.016839981079101562, -0.013744354248046875, -0.010648727416992188, -0.0075531005859375, -0.0044574737548828125, -0.001361846923828125, 0.0017337799072265625, 0.00482940673828125, 0.007925033569335938, 0.011020660400390625, 0.014116287231445312, 0.0172119140625, 0.020307540893554688, 0.023403167724609375, 0.026498794555664062, 0.02959442138671875, 0.03269004821777344, 0.035785675048828125, 0.03888130187988281, 0.0419769287109375, 0.04507255554199219, 0.048168182373046875, 0.05126380920410156, 0.05435943603515625, 0.05745506286621094, 0.060550689697265625, 0.06364631652832031, 0.066741943359375, 0.06983757019042969, 0.07293319702148438, 0.07602882385253906, 0.07912445068359375, 0.08222007751464844, 0.08531570434570312, 0.08841133117675781, 0.0915069580078125, 0.09460258483886719, 0.09769821166992188, 0.10079383850097656, 0.10388946533203125, 0.10698509216308594, 0.11008071899414062, 0.11317634582519531, 0.11627197265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 7.0, 5.0, 17.0, 10.0, 15.0, 19.0, 27.0, 36.0, 36.0, 44.0, 62.0, 78.0, 105.0, 89.0, 88.0, 79.0, 51.0, 40.0, 41.0, 28.0, 25.0, 18.0, 17.0, 10.0, 11.0, 11.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.060210227966308594, -0.05810356140136719, -0.05599689483642578, -0.053890228271484375, -0.05178356170654297, -0.04967689514160156, -0.047570228576660156, -0.04546356201171875, -0.043356895446777344, -0.04125022888183594, -0.03914356231689453, -0.037036895751953125, -0.03493022918701172, -0.03282356262207031, -0.030716896057128906, -0.0286102294921875, -0.026503562927246094, -0.024396896362304688, -0.02229022979736328, -0.020183563232421875, -0.01807689666748047, -0.015970230102539062, -0.013863563537597656, -0.01175689697265625, -0.009650230407714844, -0.0075435638427734375, -0.005436897277832031, -0.003330230712890625, -0.0012235641479492188, 0.0008831024169921875, 0.0029897689819335938, 0.005096435546875, 0.007203102111816406, 0.009309768676757812, 0.011416435241699219, 0.013523101806640625, 0.01562976837158203, 0.017736434936523438, 0.019843101501464844, 0.02194976806640625, 0.024056434631347656, 0.026163101196289062, 0.02826976776123047, 0.030376434326171875, 0.03248310089111328, 0.03458976745605469, 0.036696434020996094, 0.0388031005859375, 0.040909767150878906, 0.04301643371582031, 0.04512310028076172, 0.047229766845703125, 0.04933643341064453, 0.05144309997558594, 0.053549766540527344, 0.05565643310546875, 0.057763099670410156, 0.05986976623535156, 0.06197643280029297, 0.06408309936523438, 0.06618976593017578, 0.06829643249511719, 0.0704030990600586, 0.072509765625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 8.0, 6.0, 17.0, 19.0, 38.0, 50.0, 97.0, 122.0, 129.0, 122.0, 133.0, 88.0, 88.0, 35.0, 22.0, 9.0, 13.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888552665710449, -0.5526053309440613, -0.5163554549217224, -0.48010551929473877, -0.4438556134700775, -0.40760570764541626, -0.3713557720184326, -0.33510586619377136, -0.2988559603691101, -0.26260605454444885, -0.2263561338186264, -0.19010621309280396, -0.1538563072681427, -0.11760640144348145, -0.081356480717659, -0.04510655999183655, -0.008856654167175293, 0.02739325910806656, 0.06364317238330841, 0.09989308565855026, 0.13614299893379211, 0.17239290475845337, 0.20864282548427582, 0.24489274621009827, 0.2811426520347595, 0.3173925578594208, 0.35364246368408203, 0.3898923993110657, 0.42614230513572693, 0.4623922109603882, 0.4986421465873718, 0.5348920822143555, 0.5711419582366943, 0.607391893863678, 0.6436417698860168, 0.6798917055130005, 0.7161415815353394, 0.752391517162323, 0.7886414527893066, 0.8248913288116455, 0.8611412644386292, 0.8973912000656128, 0.9336410760879517, 0.9698910117149353, 1.006140947341919, 1.0423908233642578, 1.0786406993865967, 1.114890694618225, 1.151140570640564, 1.1873904466629028, 1.2236404418945312, 1.2598903179168701, 1.296140193939209, 1.3323900699615479, 1.3686400651931763, 1.4048899412155151, 1.4411399364471436, 1.4773898124694824, 1.5136398077011108, 1.5498896837234497, 1.5861395597457886, 1.622389554977417, 1.6586394309997559, 1.6948893070220947, 1.7311391830444336]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 4.0, 7.0, 12.0, 14.0, 16.0, 18.0, 16.0, 24.0, 34.0, 35.0, 34.0, 47.0, 34.0, 43.0, 47.0, 44.0, 47.0, 47.0, 50.0, 52.0, 41.0, 35.0, 43.0, 36.0, 36.0, 30.0, 31.0, 22.0, 20.0, 17.0, 14.0, 10.0, 12.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7124967575073242, -0.6862809062004089, -0.6600650548934937, -0.6338492631912231, -0.6076334118843079, -0.5814175605773926, -0.5552017688751221, -0.5289859175682068, -0.5027700662612915, -0.4765542149543762, -0.4503383934497833, -0.42412257194519043, -0.39790672063827515, -0.37169086933135986, -0.34547504782676697, -0.3192592263221741, -0.2930433750152588, -0.2668275237083435, -0.2406117022037506, -0.21439586579799652, -0.18818002939224243, -0.16196419298648834, -0.13574835658073425, -0.10953252017498016, -0.08331668376922607, -0.057100847363471985, -0.030885010957717896, -0.004669174551963806, 0.021546661853790283, 0.04776249825954437, 0.07397833466529846, 0.10019417107105255, 0.12640994787216187, 0.15262578427791595, 0.17884162068367004, 0.20505745708942413, 0.23127329349517822, 0.2574891448020935, 0.2837049663066864, 0.3099207878112793, 0.3361366391181946, 0.36235249042510986, 0.38856831192970276, 0.41478413343429565, 0.44099998474121094, 0.4672158360481262, 0.4934316575527191, 0.519647479057312, 0.5458633303642273, 0.5720791816711426, 0.5982949733734131, 0.6245108246803284, 0.6507266759872437, 0.6769425272941589, 0.7031583786010742, 0.7293741703033447, 0.75559002161026, 0.7818058729171753, 0.8080216646194458, 0.8342375159263611, 0.8604533672332764, 0.8866692185401917, 0.9128850698471069, 0.9391008615493774, 0.9653167128562927]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 3.0, 4.0, 3.0, 14.0, 17.0, 17.0, 39.0, 60.0, 85.0, 122.0, 206.0, 382.0, 609.0, 1221.0, 2438.0, 5267.0, 13525.0, 42526.0, 199647.0, 3392947.0, 434695.0, 67255.0, 19272.0, 7111.0, 3194.0, 1533.0, 849.0, 494.0, 280.0, 178.0, 85.0, 60.0, 36.0, 43.0, 22.0, 16.0, 11.0, 6.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14788818359375, -0.14306640625, -0.13824462890625, -0.1334228515625, -0.12860107421875, -0.123779296875, -0.11895751953125, -0.1141357421875, -0.10931396484375, -0.1044921875, -0.09967041015625, -0.0948486328125, -0.09002685546875, -0.085205078125, -0.08038330078125, -0.0755615234375, -0.07073974609375, -0.06591796875, -0.06109619140625, -0.0562744140625, -0.05145263671875, -0.046630859375, -0.04180908203125, -0.0369873046875, -0.03216552734375, -0.02734375, -0.02252197265625, -0.0177001953125, -0.01287841796875, -0.008056640625, -0.00323486328125, 0.0015869140625, 0.00640869140625, 0.01123046875, 0.01605224609375, 0.0208740234375, 0.02569580078125, 0.030517578125, 0.03533935546875, 0.0401611328125, 0.04498291015625, 0.0498046875, 0.05462646484375, 0.0594482421875, 0.06427001953125, 0.069091796875, 0.07391357421875, 0.0787353515625, 0.08355712890625, 0.08837890625, 0.09320068359375, 0.0980224609375, 0.10284423828125, 0.107666015625, 0.11248779296875, 0.1173095703125, 0.12213134765625, 0.126953125, 0.13177490234375, 0.1365966796875, 0.14141845703125, 0.146240234375, 0.15106201171875, 0.1558837890625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 12.0, 20.0, 16.0, 36.0, 52.0, 51.0, 76.0, 76.0, 99.0, 93.0, 69.0, 78.0, 75.0, 59.0, 51.0, 31.0, 31.0, 18.0, 19.0, 4.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05194091796875, -0.050345420837402344, -0.04874992370605469, -0.04715442657470703, -0.045558929443359375, -0.04396343231201172, -0.04236793518066406, -0.040772438049316406, -0.03917694091796875, -0.037581443786621094, -0.03598594665527344, -0.03439044952392578, -0.032794952392578125, -0.03119945526123047, -0.029603958129882812, -0.028008460998535156, -0.0264129638671875, -0.024817466735839844, -0.023221969604492188, -0.02162647247314453, -0.020030975341796875, -0.01843547821044922, -0.016839981079101562, -0.015244483947753906, -0.01364898681640625, -0.012053489685058594, -0.010457992553710938, -0.008862495422363281, -0.007266998291015625, -0.005671501159667969, -0.0040760040283203125, -0.0024805068969726562, -0.000885009765625, 0.0007104873657226562, 0.0023059844970703125, 0.0039014816284179688, 0.005496978759765625, 0.007092475891113281, 0.008687973022460938, 0.010283470153808594, 0.01187896728515625, 0.013474464416503906, 0.015069961547851562, 0.01666545867919922, 0.018260955810546875, 0.01985645294189453, 0.021451950073242188, 0.023047447204589844, 0.0246429443359375, 0.026238441467285156, 0.027833938598632812, 0.02942943572998047, 0.031024932861328125, 0.03262042999267578, 0.03421592712402344, 0.035811424255371094, 0.03740692138671875, 0.039002418518066406, 0.04059791564941406, 0.04219341278076172, 0.043788909912109375, 0.04538440704345703, 0.04697990417480469, 0.048575401306152344, 0.0501708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 7.0, 4.0, 9.0, 11.0, 10.0, 21.0, 28.0, 46.0, 72.0, 93.0, 184.0, 342.0, 685.0, 1639.0, 3952.0, 11387.0, 39201.0, 175362.0, 2923299.0, 893931.0, 104108.0, 26256.0, 8107.0, 2994.0, 1213.0, 560.0, 306.0, 170.0, 88.0, 75.0, 34.0, 21.0, 18.0, 16.0, 10.0, 5.0, 9.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.1658191680908203, -0.15964126586914062, -0.15346336364746094, -0.14728546142578125, -0.14110755920410156, -0.13492965698242188, -0.1287517547607422, -0.1225738525390625, -0.11639595031738281, -0.11021804809570312, -0.10404014587402344, -0.09786224365234375, -0.09168434143066406, -0.08550643920898438, -0.07932853698730469, -0.073150634765625, -0.06697273254394531, -0.060794830322265625, -0.05461692810058594, -0.04843902587890625, -0.04226112365722656, -0.036083221435546875, -0.029905319213867188, -0.0237274169921875, -0.017549514770507812, -0.011371612548828125, -0.0051937103271484375, 0.00098419189453125, 0.0071620941162109375, 0.013339996337890625, 0.019517898559570312, 0.02569580078125, 0.03187370300292969, 0.038051605224609375, 0.04422950744628906, 0.05040740966796875, 0.05658531188964844, 0.06276321411132812, 0.06894111633300781, 0.0751190185546875, 0.08129692077636719, 0.08747482299804688, 0.09365272521972656, 0.09983062744140625, 0.10600852966308594, 0.11218643188476562, 0.11836433410644531, 0.124542236328125, 0.1307201385498047, 0.13689804077148438, 0.14307594299316406, 0.14925384521484375, 0.15543174743652344, 0.16160964965820312, 0.1677875518798828, 0.1739654541015625, 0.1801433563232422, 0.18632125854492188, 0.19249916076660156, 0.19867706298828125, 0.20485496520996094, 0.21103286743164062, 0.2172107696533203, 0.223388671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 7.0, 11.0, 13.0, 15.0, 18.0, 35.0, 47.0, 48.0, 91.0, 172.0, 276.0, 690.0, 1403.0, 531.0, 250.0, 145.0, 87.0, 66.0, 43.0, 29.0, 30.0, 17.0, 15.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049591064453125, -0.047274112701416016, -0.04495716094970703, -0.04264020919799805, -0.04032325744628906, -0.03800630569458008, -0.035689353942871094, -0.03337240219116211, -0.031055450439453125, -0.02873849868774414, -0.026421546936035156, -0.024104595184326172, -0.021787643432617188, -0.019470691680908203, -0.01715373992919922, -0.014836788177490234, -0.01251983642578125, -0.010202884674072266, -0.007885932922363281, -0.005568981170654297, -0.0032520294189453125, -0.0009350776672363281, 0.0013818740844726562, 0.0036988258361816406, 0.006015777587890625, 0.00833272933959961, 0.010649681091308594, 0.012966632843017578, 0.015283584594726562, 0.017600536346435547, 0.01991748809814453, 0.022234439849853516, 0.0245513916015625, 0.026868343353271484, 0.02918529510498047, 0.03150224685668945, 0.03381919860839844, 0.03613615036010742, 0.038453102111816406, 0.04077005386352539, 0.043087005615234375, 0.04540395736694336, 0.047720909118652344, 0.05003786087036133, 0.05235481262207031, 0.0546717643737793, 0.05698871612548828, 0.059305667877197266, 0.06162261962890625, 0.06393957138061523, 0.06625652313232422, 0.0685734748840332, 0.07089042663574219, 0.07320737838745117, 0.07552433013916016, 0.07784128189086914, 0.08015823364257812, 0.08247518539428711, 0.0847921371459961, 0.08710908889770508, 0.08942604064941406, 0.09174299240112305, 0.09405994415283203, 0.09637689590454102, 0.09869384765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 15.0, 21.0, 42.0, 66.0, 97.0, 147.0, 142.0, 158.0, 127.0, 86.0, 53.0, 26.0, 18.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3175918459892273, -0.29725760221481323, -0.27692335844039917, -0.2565890848636627, -0.23625484108924866, -0.2159205973148346, -0.19558633863925934, -0.17525207996368408, -0.15491783618927002, -0.13458359241485596, -0.1142493337392807, -0.09391508251428604, -0.07358083128929138, -0.05324658006429672, -0.03291232883930206, -0.012578070163726807, 0.007756173610687256, 0.028090424835681915, 0.048424676060676575, 0.06875892728567123, 0.0890931785106659, 0.10942742973566055, 0.1297616809606552, 0.15009593963623047, 0.17043018341064453, 0.1907644271850586, 0.21109868586063385, 0.2314329445362091, 0.25176718831062317, 0.27210143208503723, 0.2924357056617737, 0.31276994943618774, 0.3331042528152466, 0.35343849658966064, 0.3737727403640747, 0.39410701394081116, 0.4144412577152252, 0.4347755014896393, 0.45510977506637573, 0.4754440188407898, 0.49577826261520386, 0.5161125063896179, 0.536446750164032, 0.556780993938446, 0.5771152973175049, 0.597449541091919, 0.617783784866333, 0.6381180286407471, 0.6584522724151611, 0.6787865161895752, 0.6991207599639893, 0.7194550037384033, 0.7397892475128174, 0.7601235508918762, 0.7804577946662903, 0.8007920384407043, 0.8211262822151184, 0.8414605259895325, 0.8617947697639465, 0.8821290135383606, 0.9024633169174194, 0.9227975606918335, 0.9431318044662476, 0.9634660482406616, 0.9838002920150757]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 10.0, 8.0, 12.0, 17.0, 12.0, 25.0, 32.0, 35.0, 38.0, 30.0, 32.0, 41.0, 36.0, 40.0, 54.0, 50.0, 32.0, 57.0, 46.0, 40.0, 49.0, 36.0, 48.0, 45.0, 25.0, 23.0, 27.0, 17.0, 19.0, 16.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.3442193269729614, -0.33554336428642273, -0.32686740159988403, -0.3181914687156677, -0.30951550602912903, -0.30083954334259033, -0.292163610458374, -0.2834876477718353, -0.27481168508529663, -0.26613572239875793, -0.25745975971221924, -0.24878382682800293, -0.24010786414146423, -0.23143190145492554, -0.22275595366954803, -0.21408000588417053, -0.20540404319763184, -0.19672808051109314, -0.18805213272571564, -0.17937618494033813, -0.17070022225379944, -0.16202425956726074, -0.15334831178188324, -0.14467236399650574, -0.13599640130996704, -0.12732043862342834, -0.11864449083805084, -0.10996853560209274, -0.10129258036613464, -0.09261662513017654, -0.08394066989421844, -0.07526471465826035, -0.06658875942230225, -0.05791280418634415, -0.04923684895038605, -0.04056089371442795, -0.03188493847846985, -0.02320898324251175, -0.01453302800655365, -0.0058570727705955505, 0.002818882465362549, 0.011494837701320648, 0.020170792937278748, 0.028846748173236847, 0.037522703409194946, 0.046198658645153046, 0.054874613881111145, 0.06355056911706924, 0.07222652435302734, 0.08090247958898544, 0.08957843482494354, 0.09825439006090164, 0.10693034529685974, 0.11560630053281784, 0.12428225576877594, 0.13295820355415344, 0.14163416624069214, 0.15031012892723083, 0.15898607671260834, 0.16766202449798584, 0.17633798718452454, 0.18501394987106323, 0.19368989765644073, 0.20236584544181824, 0.21104180812835693]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 7.0, 5.0, 28.0, 29.0, 35.0, 51.0, 72.0, 111.0, 158.0, 261.0, 394.0, 642.0, 1113.0, 2057.0, 3755.0, 7232.0, 13841.0, 26361.0, 52453.0, 104190.0, 218777.0, 302925.0, 155556.0, 77121.0, 39264.0, 19695.0, 10126.0, 5343.0, 2887.0, 1604.0, 929.0, 571.0, 324.0, 201.0, 127.0, 95.0, 58.0, 39.0, 34.0, 19.0, 23.0, 6.0, 6.0, 10.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1070556640625, -0.10339927673339844, -0.09974288940429688, -0.09608650207519531, -0.09243011474609375, -0.08877372741699219, -0.08511734008789062, -0.08146095275878906, -0.0778045654296875, -0.07414817810058594, -0.07049179077148438, -0.06683540344238281, -0.06317901611328125, -0.05952262878417969, -0.055866241455078125, -0.05220985412597656, -0.048553466796875, -0.04489707946777344, -0.041240692138671875, -0.03758430480957031, -0.03392791748046875, -0.030271530151367188, -0.026615142822265625, -0.022958755493164062, -0.0193023681640625, -0.015645980834960938, -0.011989593505859375, -0.008333206176757812, -0.00467681884765625, -0.0010204315185546875, 0.002635955810546875, 0.0062923431396484375, 0.00994873046875, 0.013605117797851562, 0.017261505126953125, 0.020917892456054688, 0.02457427978515625, 0.028230667114257812, 0.031887054443359375, 0.03554344177246094, 0.0391998291015625, 0.04285621643066406, 0.046512603759765625, 0.05016899108886719, 0.05382537841796875, 0.05748176574707031, 0.061138153076171875, 0.06479454040527344, 0.068450927734375, 0.07210731506347656, 0.07576370239257812, 0.07942008972167969, 0.08307647705078125, 0.08673286437988281, 0.09038925170898438, 0.09404563903808594, 0.0977020263671875, 0.10135841369628906, 0.10501480102539062, 0.10867118835449219, 0.11232757568359375, 0.11598396301269531, 0.11964035034179688, 0.12329673767089844, 0.126953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 8.0, 10.0, 11.0, 20.0, 23.0, 33.0, 52.0, 54.0, 63.0, 63.0, 72.0, 65.0, 80.0, 86.0, 71.0, 71.0, 53.0, 40.0, 30.0, 25.0, 21.0, 16.0, 13.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0484619140625, -0.046901702880859375, -0.04534149169921875, -0.043781280517578125, -0.0422210693359375, -0.040660858154296875, -0.03910064697265625, -0.037540435791015625, -0.035980224609375, -0.034420013427734375, -0.03285980224609375, -0.031299591064453125, -0.0297393798828125, -0.028179168701171875, -0.02661895751953125, -0.025058746337890625, -0.02349853515625, -0.021938323974609375, -0.02037811279296875, -0.018817901611328125, -0.0172576904296875, -0.015697479248046875, -0.01413726806640625, -0.012577056884765625, -0.011016845703125, -0.009456634521484375, -0.00789642333984375, -0.006336212158203125, -0.0047760009765625, -0.003215789794921875, -0.00165557861328125, -9.5367431640625e-05, 0.00146484375, 0.003025054931640625, 0.00458526611328125, 0.006145477294921875, 0.0077056884765625, 0.009265899658203125, 0.01082611083984375, 0.012386322021484375, 0.013946533203125, 0.015506744384765625, 0.01706695556640625, 0.018627166748046875, 0.0201873779296875, 0.021747589111328125, 0.02330780029296875, 0.024868011474609375, 0.02642822265625, 0.027988433837890625, 0.02954864501953125, 0.031108856201171875, 0.0326690673828125, 0.034229278564453125, 0.03578948974609375, 0.037349700927734375, 0.038909912109375, 0.040470123291015625, 0.04203033447265625, 0.043590545654296875, 0.0451507568359375, 0.046710968017578125, 0.04827117919921875, 0.049831390380859375, 0.0513916015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 6.0, 8.0, 8.0, 28.0, 20.0, 31.0, 34.0, 66.0, 71.0, 122.0, 167.0, 238.0, 337.0, 502.0, 837.0, 1442.0, 3538.0, 12658.0, 56414.0, 255253.0, 529308.0, 143181.0, 31100.0, 7432.0, 2409.0, 1186.0, 635.0, 437.0, 325.0, 211.0, 164.0, 111.0, 88.0, 58.0, 39.0, 28.0, 26.0, 15.0, 7.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2066650390625, -0.20046043395996094, -0.19425582885742188, -0.1880512237548828, -0.18184661865234375, -0.1756420135498047, -0.16943740844726562, -0.16323280334472656, -0.1570281982421875, -0.15082359313964844, -0.14461898803710938, -0.1384143829345703, -0.13220977783203125, -0.1260051727294922, -0.11980056762695312, -0.11359596252441406, -0.107391357421875, -0.10118675231933594, -0.09498214721679688, -0.08877754211425781, -0.08257293701171875, -0.07636833190917969, -0.07016372680664062, -0.06395912170410156, -0.0577545166015625, -0.05154991149902344, -0.045345306396484375, -0.03914070129394531, -0.03293609619140625, -0.026731491088867188, -0.020526885986328125, -0.014322280883789062, -0.00811767578125, -0.0019130706787109375, 0.004291534423828125, 0.010496139526367188, 0.01670074462890625, 0.022905349731445312, 0.029109954833984375, 0.03531455993652344, 0.0415191650390625, 0.04772377014160156, 0.053928375244140625, 0.06013298034667969, 0.06633758544921875, 0.07254219055175781, 0.07874679565429688, 0.08495140075683594, 0.091156005859375, 0.09736061096191406, 0.10356521606445312, 0.10976982116699219, 0.11597442626953125, 0.12217903137207031, 0.12838363647460938, 0.13458824157714844, 0.1407928466796875, 0.14699745178222656, 0.15320205688476562, 0.1594066619873047, 0.16561126708984375, 0.1718158721923828, 0.17802047729492188, 0.18422508239746094, 0.1904296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 9.0, 20.0, 19.0, 18.0, 25.0, 37.0, 29.0, 42.0, 35.0, 44.0, 64.0, 44.0, 56.0, 45.0, 61.0, 56.0, 60.0, 45.0, 29.0, 31.0, 36.0, 31.0, 27.0, 22.0, 15.0, 13.0, 20.0, 13.0, 8.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.18798828125, -0.18281173706054688, -0.17763519287109375, -0.17245864868164062, -0.1672821044921875, -0.16210556030273438, -0.15692901611328125, -0.15175247192382812, -0.146575927734375, -0.14139938354492188, -0.13622283935546875, -0.13104629516601562, -0.1258697509765625, -0.12069320678710938, -0.11551666259765625, -0.11034011840820312, -0.10516357421875, -0.09998703002929688, -0.09481048583984375, -0.08963394165039062, -0.0844573974609375, -0.07928085327148438, -0.07410430908203125, -0.06892776489257812, -0.063751220703125, -0.058574676513671875, -0.05339813232421875, -0.048221588134765625, -0.0430450439453125, -0.037868499755859375, -0.03269195556640625, -0.027515411376953125, -0.0223388671875, -0.017162322998046875, -0.01198577880859375, -0.006809234619140625, -0.0016326904296875, 0.003543853759765625, 0.00872039794921875, 0.013896942138671875, 0.019073486328125, 0.024250030517578125, 0.02942657470703125, 0.034603118896484375, 0.0397796630859375, 0.044956207275390625, 0.05013275146484375, 0.055309295654296875, 0.06048583984375, 0.06566238403320312, 0.07083892822265625, 0.07601547241210938, 0.0811920166015625, 0.08636856079101562, 0.09154510498046875, 0.09672164916992188, 0.101898193359375, 0.10707473754882812, 0.11225128173828125, 0.11742782592773438, 0.1226043701171875, 0.12778091430664062, 0.13295745849609375, 0.13813400268554688, 0.143310546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 9.0, 9.0, 22.0, 23.0, 28.0, 47.0, 43.0, 76.0, 107.0, 168.0, 253.0, 381.0, 701.0, 1302.0, 3296.0, 12837.0, 148238.0, 810505.0, 57947.0, 7511.0, 2283.0, 1107.0, 596.0, 358.0, 221.0, 142.0, 79.0, 75.0, 52.0, 26.0, 17.0, 21.0, 21.0, 10.0, 5.0, 7.0, 1.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24053573608398438, -0.23204803466796875, -0.22356033325195312, -0.2150726318359375, -0.20658493041992188, -0.19809722900390625, -0.18960952758789062, -0.181121826171875, -0.17263412475585938, -0.16414642333984375, -0.15565872192382812, -0.1471710205078125, -0.13868331909179688, -0.13019561767578125, -0.12170791625976562, -0.11322021484375, -0.10473251342773438, -0.09624481201171875, -0.08775711059570312, -0.0792694091796875, -0.07078170776367188, -0.06229400634765625, -0.053806304931640625, -0.045318603515625, -0.036830902099609375, -0.02834320068359375, -0.019855499267578125, -0.0113677978515625, -0.002880096435546875, 0.00560760498046875, 0.014095306396484375, 0.0225830078125, 0.031070709228515625, 0.03955841064453125, 0.048046112060546875, 0.0565338134765625, 0.06502151489257812, 0.07350921630859375, 0.08199691772460938, 0.090484619140625, 0.09897232055664062, 0.10746002197265625, 0.11594772338867188, 0.1244354248046875, 0.13292312622070312, 0.14141082763671875, 0.14989852905273438, 0.15838623046875, 0.16687393188476562, 0.17536163330078125, 0.18384933471679688, 0.1923370361328125, 0.20082473754882812, 0.20931243896484375, 0.21780014038085938, 0.226287841796875, 0.23477554321289062, 0.24326324462890625, 0.2517509460449219, 0.2602386474609375, 0.2687263488769531, 0.27721405029296875, 0.2857017517089844, 0.294189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 13.0, 12.0, 20.0, 35.0, 31.0, 40.0, 54.0, 65.0, 86.0, 93.0, 97.0, 93.0, 75.0, 57.0, 52.0, 51.0, 36.0, 25.0, 16.0, 13.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011366605758666992, -0.00011036824434995651, -0.0001070704311132431, -0.0001037726178765297, -0.00010047480463981628, -9.717699140310287e-05, -9.387917816638947e-05, -9.058136492967606e-05, -8.728355169296265e-05, -8.398573845624924e-05, -8.068792521953583e-05, -7.739011198282242e-05, -7.409229874610901e-05, -7.07944855093956e-05, -6.749667227268219e-05, -6.419885903596878e-05, -6.090104579925537e-05, -5.760323256254196e-05, -5.430541932582855e-05, -5.100760608911514e-05, -4.7709792852401733e-05, -4.4411979615688324e-05, -4.1114166378974915e-05, -3.7816353142261505e-05, -3.4518539905548096e-05, -3.1220726668834686e-05, -2.7922913432121277e-05, -2.4625100195407867e-05, -2.1327286958694458e-05, -1.802947372198105e-05, -1.473166048526764e-05, -1.143384724855423e-05, -8.13603401184082e-06, -4.838220775127411e-06, -1.5404075384140015e-06, 1.757405698299408e-06, 5.055218935012817e-06, 8.353032171726227e-06, 1.1650845408439636e-05, 1.4948658645153046e-05, 1.8246471881866455e-05, 2.1544285118579865e-05, 2.4842098355293274e-05, 2.8139911592006683e-05, 3.143772482872009e-05, 3.47355380654335e-05, 3.803335130214691e-05, 4.133116453886032e-05, 4.462897777557373e-05, 4.792679101228714e-05, 5.122460424900055e-05, 5.452241748571396e-05, 5.782023072242737e-05, 6.111804395914078e-05, 6.441585719585419e-05, 6.77136704325676e-05, 7.1011483669281e-05, 7.430929690599442e-05, 7.760711014270782e-05, 8.090492337942123e-05, 8.420273661613464e-05, 8.750054985284805e-05, 9.079836308956146e-05, 9.409617632627487e-05, 9.739398956298828e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 13.0, 17.0, 28.0, 33.0, 69.0, 100.0, 215.0, 402.0, 963.0, 2348.0, 7991.0, 65313.0, 854538.0, 101672.0, 10066.0, 2750.0, 1014.0, 427.0, 242.0, 124.0, 76.0, 39.0, 30.0, 16.0, 10.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.28466796875, -0.2759284973144531, -0.26718902587890625, -0.2584495544433594, -0.2497100830078125, -0.24097061157226562, -0.23223114013671875, -0.22349166870117188, -0.214752197265625, -0.20601272583007812, -0.19727325439453125, -0.18853378295898438, -0.1797943115234375, -0.17105484008789062, -0.16231536865234375, -0.15357589721679688, -0.14483642578125, -0.13609695434570312, -0.12735748291015625, -0.11861801147460938, -0.1098785400390625, -0.10113906860351562, -0.09239959716796875, -0.08366012573242188, -0.074920654296875, -0.06618118286132812, -0.05744171142578125, -0.048702239990234375, -0.0399627685546875, -0.031223297119140625, -0.02248382568359375, -0.013744354248046875, -0.0050048828125, 0.003734588623046875, 0.01247406005859375, 0.021213531494140625, 0.0299530029296875, 0.038692474365234375, 0.04743194580078125, 0.056171417236328125, 0.064910888671875, 0.07365036010742188, 0.08238983154296875, 0.09112930297851562, 0.0998687744140625, 0.10860824584960938, 0.11734771728515625, 0.12608718872070312, 0.13482666015625, 0.14356613159179688, 0.15230560302734375, 0.16104507446289062, 0.1697845458984375, 0.17852401733398438, 0.18726348876953125, 0.19600296020507812, 0.204742431640625, 0.21348190307617188, 0.22222137451171875, 0.23096084594726562, 0.2397003173828125, 0.24843978881835938, 0.25717926025390625, 0.2659187316894531, 0.274658203125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 10.0, 13.0, 29.0, 33.0, 49.0, 63.0, 81.0, 131.0, 136.0, 129.0, 108.0, 65.0, 45.0, 21.0, 18.0, 15.0, 6.0, 3.0, 2.0, 9.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1107177734375, -0.10668182373046875, -0.1026458740234375, -0.09860992431640625, -0.094573974609375, -0.09053802490234375, -0.0865020751953125, -0.08246612548828125, -0.07843017578125, -0.07439422607421875, -0.0703582763671875, -0.06632232666015625, -0.062286376953125, -0.05825042724609375, -0.0542144775390625, -0.05017852783203125, -0.046142578125, -0.04210662841796875, -0.0380706787109375, -0.03403472900390625, -0.029998779296875, -0.02596282958984375, -0.0219268798828125, -0.01789093017578125, -0.01385498046875, -0.00981903076171875, -0.0057830810546875, -0.00174713134765625, 0.002288818359375, 0.00632476806640625, 0.0103607177734375, 0.01439666748046875, 0.0184326171875, 0.02246856689453125, 0.0265045166015625, 0.03054046630859375, 0.034576416015625, 0.03861236572265625, 0.0426483154296875, 0.04668426513671875, 0.05072021484375, 0.05475616455078125, 0.0587921142578125, 0.06282806396484375, 0.066864013671875, 0.07089996337890625, 0.0749359130859375, 0.07897186279296875, 0.0830078125, 0.08704376220703125, 0.0910797119140625, 0.09511566162109375, 0.099151611328125, 0.10318756103515625, 0.1072235107421875, 0.11125946044921875, 0.11529541015625, 0.11933135986328125, 0.1233673095703125, 0.12740325927734375, 0.131439208984375, 0.13547515869140625, 0.1395111083984375, 0.14354705810546875, 0.1475830078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 16.0, 22.0, 47.0, 62.0, 111.0, 122.0, 146.0, 134.0, 112.0, 94.0, 51.0, 30.0, 16.0, 12.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4575613737106323, -1.4084463119506836, -1.3593312501907349, -1.3102161884307861, -1.261101245880127, -1.2119861841201782, -1.1628711223602295, -1.1137560606002808, -1.064640998840332, -1.0155259370803833, -0.9664108753204346, -0.9172958731651306, -0.8681808114051819, -0.8190657496452332, -0.7699507474899292, -0.7208356857299805, -0.6717206239700317, -0.622605562210083, -0.5734905004501343, -0.5243754982948303, -0.4752604365348816, -0.42614537477493286, -0.3770303428173065, -0.3279153108596802, -0.27880024909973145, -0.2296852022409439, -0.18057015538215637, -0.13145510852336884, -0.0823400616645813, -0.03322501480579376, 0.015890032052993774, 0.06500506401062012, 0.1141200065612793, 0.16323505342006683, 0.21235010027885437, 0.2614651322364807, 0.31058019399642944, 0.3596952557563782, 0.4088102877140045, 0.45792531967163086, 0.5070403814315796, 0.5561554431915283, 0.605270504951477, 0.654385507106781, 0.7035005688667297, 0.7526156306266785, 0.8017306327819824, 0.8508456945419312, 0.8999607563018799, 0.9490758180618286, 0.9981908798217773, 1.047305941581726, 1.0964210033416748, 1.145535945892334, 1.1946510076522827, 1.2437660694122314, 1.2928811311721802, 1.341996192932129, 1.3911112546920776, 1.4402263164520264, 1.4893412590026855, 1.5384563207626343, 1.587571382522583, 1.6366864442825317, 1.6858015060424805]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 9.0, 6.0, 14.0, 7.0, 17.0, 15.0, 25.0, 35.0, 22.0, 31.0, 40.0, 50.0, 41.0, 44.0, 43.0, 48.0, 43.0, 33.0, 62.0, 37.0, 44.0, 37.0, 31.0, 31.0, 29.0, 30.0, 23.0, 24.0, 22.0, 20.0, 12.0, 14.0, 5.0, 8.0, 5.0, 8.0, 6.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.7968870997428894, -0.7721466422080994, -0.7474061846733093, -0.7226657271385193, -0.6979252696037292, -0.6731848120689392, -0.6484442949295044, -0.6237038373947144, -0.5989633798599243, -0.5742229223251343, -0.5494824647903442, -0.5247420072555542, -0.5000015497207642, -0.4752610921859741, -0.4505206048488617, -0.42578014731407166, -0.401039719581604, -0.37629926204681396, -0.3515588045120239, -0.3268183469772339, -0.30207788944244385, -0.2773374319076538, -0.2525969445705414, -0.22785648703575134, -0.2031160295009613, -0.17837557196617126, -0.15363511443138123, -0.12889464199543, -0.10415418446063995, -0.07941372692584991, -0.05467325448989868, -0.029932796955108643, -0.005192279815673828, 0.01954818144440651, 0.04428864270448685, 0.06902910768985748, 0.09376956522464752, 0.11851002275943756, 0.1432504951953888, 0.16799095273017883, 0.19273141026496887, 0.2174718677997589, 0.24221232533454895, 0.2669528126716614, 0.2916932702064514, 0.31643372774124146, 0.3411741852760315, 0.36591464281082153, 0.3906551003456116, 0.4153955578804016, 0.44013601541519165, 0.4648764729499817, 0.48961693048477173, 0.5143573880195618, 0.5390979051589966, 0.5638383626937866, 0.5885788202285767, 0.6133192777633667, 0.6380597352981567, 0.6628001928329468, 0.6875406503677368, 0.7122811079025269, 0.7370215654373169, 0.7617620229721069, 0.786502480506897]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 17.0, 26.0, 29.0, 58.0, 87.0, 152.0, 251.0, 487.0, 795.0, 1475.0, 2772.0, 6032.0, 13171.0, 32216.0, 99163.0, 560890.0, 3123383.0, 249719.0, 61665.0, 22536.0, 9453.0, 4613.0, 2309.0, 1199.0, 700.0, 401.0, 255.0, 153.0, 88.0, 56.0, 41.0, 24.0, 15.0, 17.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12347412109375, -0.11895275115966797, -0.11443138122558594, -0.1099100112915039, -0.10538864135742188, -0.10086727142333984, -0.09634590148925781, -0.09182453155517578, -0.08730316162109375, -0.08278179168701172, -0.07826042175292969, -0.07373905181884766, -0.06921768188476562, -0.0646963119506836, -0.06017494201660156, -0.05565357208251953, -0.0511322021484375, -0.04661083221435547, -0.04208946228027344, -0.037568092346191406, -0.033046722412109375, -0.028525352478027344, -0.024003982543945312, -0.01948261260986328, -0.01496124267578125, -0.010439872741699219, -0.0059185028076171875, -0.0013971328735351562, 0.003124237060546875, 0.007645606994628906, 0.012166976928710938, 0.01668834686279297, 0.021209716796875, 0.02573108673095703, 0.030252456665039062, 0.034773826599121094, 0.039295196533203125, 0.043816566467285156, 0.04833793640136719, 0.05285930633544922, 0.05738067626953125, 0.06190204620361328, 0.06642341613769531, 0.07094478607177734, 0.07546615600585938, 0.0799875259399414, 0.08450889587402344, 0.08903026580810547, 0.0935516357421875, 0.09807300567626953, 0.10259437561035156, 0.1071157455444336, 0.11163711547851562, 0.11615848541259766, 0.12067985534667969, 0.12520122528076172, 0.12972259521484375, 0.13424396514892578, 0.1387653350830078, 0.14328670501708984, 0.14780807495117188, 0.1523294448852539, 0.15685081481933594, 0.16137218475341797, 0.1658935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 6.0, 4.0, 8.0, 7.0, 25.0, 16.0, 32.0, 34.0, 41.0, 58.0, 62.0, 68.0, 78.0, 74.0, 78.0, 80.0, 62.0, 47.0, 54.0, 36.0, 39.0, 21.0, 21.0, 13.0, 12.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045074462890625, -0.04356813430786133, -0.042061805725097656, -0.040555477142333984, -0.03904914855957031, -0.03754281997680664, -0.03603649139404297, -0.0345301628112793, -0.033023834228515625, -0.03151750564575195, -0.03001117706298828, -0.02850484848022461, -0.026998519897460938, -0.025492191314697266, -0.023985862731933594, -0.022479534149169922, -0.02097320556640625, -0.019466876983642578, -0.017960548400878906, -0.016454219818115234, -0.014947891235351562, -0.01344156265258789, -0.011935234069824219, -0.010428905487060547, -0.008922576904296875, -0.007416248321533203, -0.005909919738769531, -0.004403591156005859, -0.0028972625732421875, -0.0013909339904785156, 0.00011539459228515625, 0.0016217231750488281, 0.0031280517578125, 0.004634380340576172, 0.006140708923339844, 0.007647037506103516, 0.009153366088867188, 0.01065969467163086, 0.012166023254394531, 0.013672351837158203, 0.015178680419921875, 0.016685009002685547, 0.01819133758544922, 0.01969766616821289, 0.021203994750976562, 0.022710323333740234, 0.024216651916503906, 0.025722980499267578, 0.02722930908203125, 0.028735637664794922, 0.030241966247558594, 0.031748294830322266, 0.03325462341308594, 0.03476095199584961, 0.03626728057861328, 0.03777360916137695, 0.039279937744140625, 0.0407862663269043, 0.04229259490966797, 0.04379892349243164, 0.04530525207519531, 0.046811580657958984, 0.048317909240722656, 0.04982423782348633, 0.05133056640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 7.0, 3.0, 10.0, 9.0, 18.0, 29.0, 43.0, 48.0, 94.0, 143.0, 205.0, 326.0, 596.0, 1030.0, 2002.0, 3921.0, 8172.0, 18689.0, 45940.0, 134926.0, 598820.0, 2773088.0, 427433.0, 108982.0, 38877.0, 16027.0, 7246.0, 3444.0, 1752.0, 954.0, 512.0, 321.0, 170.0, 131.0, 99.0, 64.0, 42.0, 43.0, 20.0, 15.0, 13.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.15576171875, -0.15148353576660156, -0.14720535278320312, -0.1429271697998047, -0.13864898681640625, -0.1343708038330078, -0.13009262084960938, -0.12581443786621094, -0.1215362548828125, -0.11725807189941406, -0.11297988891601562, -0.10870170593261719, -0.10442352294921875, -0.10014533996582031, -0.09586715698242188, -0.09158897399902344, -0.087310791015625, -0.08303260803222656, -0.07875442504882812, -0.07447624206542969, -0.07019805908203125, -0.06591987609863281, -0.061641693115234375, -0.05736351013183594, -0.0530853271484375, -0.04880714416503906, -0.044528961181640625, -0.04025077819824219, -0.03597259521484375, -0.03169441223144531, -0.027416229248046875, -0.023138046264648438, -0.01885986328125, -0.014581680297851562, -0.010303497314453125, -0.0060253143310546875, -0.00174713134765625, 0.0025310516357421875, 0.006809234619140625, 0.011087417602539062, 0.0153656005859375, 0.019643783569335938, 0.023921966552734375, 0.028200149536132812, 0.03247833251953125, 0.03675651550292969, 0.041034698486328125, 0.04531288146972656, 0.049591064453125, 0.05386924743652344, 0.058147430419921875, 0.06242561340332031, 0.06670379638671875, 0.07098197937011719, 0.07526016235351562, 0.07953834533691406, 0.0838165283203125, 0.08809471130371094, 0.09237289428710938, 0.09665107727050781, 0.10092926025390625, 0.10520744323730469, 0.10948562622070312, 0.11376380920410156, 0.1180419921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 11.0, 23.0, 27.0, 45.0, 64.0, 90.0, 154.0, 283.0, 570.0, 1387.0, 660.0, 292.0, 174.0, 82.0, 65.0, 41.0, 23.0, 18.0, 17.0, 6.0, 12.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07564735412597656, -0.07243728637695312, -0.06922721862792969, -0.06601715087890625, -0.06280708312988281, -0.059597015380859375, -0.05638694763183594, -0.0531768798828125, -0.04996681213378906, -0.046756744384765625, -0.04354667663574219, -0.04033660888671875, -0.03712654113769531, -0.033916473388671875, -0.030706405639648438, -0.027496337890625, -0.024286270141601562, -0.021076202392578125, -0.017866134643554688, -0.01465606689453125, -0.011445999145507812, -0.008235931396484375, -0.0050258636474609375, -0.0018157958984375, 0.0013942718505859375, 0.004604339599609375, 0.007814407348632812, 0.01102447509765625, 0.014234542846679688, 0.017444610595703125, 0.020654678344726562, 0.02386474609375, 0.027074813842773438, 0.030284881591796875, 0.03349494934082031, 0.03670501708984375, 0.03991508483886719, 0.043125152587890625, 0.04633522033691406, 0.0495452880859375, 0.05275535583496094, 0.055965423583984375, 0.05917549133300781, 0.06238555908203125, 0.06559562683105469, 0.06880569458007812, 0.07201576232910156, 0.075225830078125, 0.07843589782714844, 0.08164596557617188, 0.08485603332519531, 0.08806610107421875, 0.09127616882324219, 0.09448623657226562, 0.09769630432128906, 0.1009063720703125, 0.10411643981933594, 0.10732650756835938, 0.11053657531738281, 0.11374664306640625, 0.11695671081542969, 0.12016677856445312, 0.12337684631347656, 0.1265869140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 10.0, 8.0, 17.0, 20.0, 30.0, 44.0, 56.0, 72.0, 94.0, 100.0, 115.0, 82.0, 78.0, 86.0, 61.0, 46.0, 29.0, 22.0, 12.0, 6.0, 9.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33861249685287476, -0.32289037108421326, -0.30716824531555176, -0.29144614934921265, -0.27572402358055115, -0.26000189781188965, -0.24427978694438934, -0.22855767607688904, -0.21283555030822754, -0.19711342453956604, -0.18139131367206573, -0.16566920280456543, -0.14994707703590393, -0.13422495126724243, -0.11850284039974213, -0.10278072208166122, -0.08705860376358032, -0.07133648544549942, -0.05561436712741852, -0.039892248809337616, -0.024170130491256714, -0.008448012173175812, 0.00727410614490509, 0.022996224462985992, 0.038718342781066895, 0.0544404610991478, 0.0701625794172287, 0.0858846977353096, 0.1016068160533905, 0.1173289343714714, 0.1330510526895523, 0.1487731635570526, 0.16449522972106934, 0.18021735548973083, 0.19593946635723114, 0.21166157722473145, 0.22738370299339294, 0.24310582876205444, 0.25882792472839355, 0.27455005049705505, 0.29027217626571655, 0.30599430203437805, 0.32171642780303955, 0.33743852376937866, 0.35316064953804016, 0.36888277530670166, 0.38460487127304077, 0.40032699704170227, 0.41604912281036377, 0.43177124857902527, 0.44749337434768677, 0.4632154703140259, 0.4789375960826874, 0.4946597218513489, 0.510381817817688, 0.5261039733886719, 0.541826069355011, 0.5575481653213501, 0.573270320892334, 0.5889924168586731, 0.6047145128250122, 0.6204366683959961, 0.6361587643623352, 0.6518809199333191, 0.6676030158996582]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 5.0, 9.0, 10.0, 12.0, 15.0, 20.0, 20.0, 26.0, 23.0, 28.0, 30.0, 37.0, 27.0, 56.0, 31.0, 46.0, 48.0, 37.0, 37.0, 40.0, 38.0, 39.0, 45.0, 36.0, 32.0, 28.0, 42.0, 26.0, 21.0, 22.0, 15.0, 15.0, 16.0, 9.0, 14.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2956008315086365, -0.28671133518218994, -0.2778218388557434, -0.2689323425292969, -0.26004284620285034, -0.2511533498764038, -0.24226383864879608, -0.23337434232234955, -0.22448483109474182, -0.2155953347682953, -0.20670583844184875, -0.19781634211540222, -0.1889268308877945, -0.18003733456134796, -0.17114783823490143, -0.1622583419084549, -0.15336884558200836, -0.14447934925556183, -0.1355898529291153, -0.12670034170150757, -0.11781084537506104, -0.1089213490486145, -0.10003185272216797, -0.09114235639572144, -0.0822528526186943, -0.07336335629224777, -0.06447385251522064, -0.05558435618877411, -0.04669485613703728, -0.037805356085300446, -0.028915859758853912, -0.02002635970711708, -0.011136859655380249, -0.002247360534965992, 0.006642138585448265, 0.015531636774539948, 0.02442113682627678, 0.03331063687801361, 0.042200133204460144, 0.051089633256196976, 0.05997913330793381, 0.06886862963438034, 0.07775813341140747, 0.086647629737854, 0.09553712606430054, 0.10442662984132767, 0.1133161261677742, 0.12220562994480133, 0.13109512627124786, 0.1399846225976944, 0.14887411892414093, 0.15776363015174866, 0.1666531264781952, 0.17554262280464172, 0.18443211913108826, 0.1933216154575348, 0.20221111178398132, 0.21110060811042786, 0.2199901044368744, 0.22887960076332092, 0.23776911199092865, 0.24665860831737518, 0.2555481195449829, 0.26443761587142944, 0.273327112197876]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 13.0, 22.0, 26.0, 51.0, 98.0, 166.0, 328.0, 581.0, 1060.0, 2170.0, 4510.0, 10126.0, 23692.0, 59477.0, 222221.0, 553883.0, 103168.0, 37974.0, 15869.0, 6649.0, 3098.0, 1567.0, 828.0, 402.0, 239.0, 139.0, 80.0, 35.0, 23.0, 18.0, 14.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.1905059814453125, -0.184600830078125, -0.1786956787109375, -0.17279052734375, -0.1668853759765625, -0.160980224609375, -0.1550750732421875, -0.149169921875, -0.1432647705078125, -0.137359619140625, -0.1314544677734375, -0.12554931640625, -0.1196441650390625, -0.113739013671875, -0.1078338623046875, -0.1019287109375, -0.0960235595703125, -0.090118408203125, -0.0842132568359375, -0.07830810546875, -0.0724029541015625, -0.066497802734375, -0.0605926513671875, -0.0546875, -0.0487823486328125, -0.042877197265625, -0.0369720458984375, -0.03106689453125, -0.0251617431640625, -0.019256591796875, -0.0133514404296875, -0.0074462890625, -0.0015411376953125, 0.004364013671875, 0.0102691650390625, 0.01617431640625, 0.0220794677734375, 0.027984619140625, 0.0338897705078125, 0.039794921875, 0.0457000732421875, 0.051605224609375, 0.0575103759765625, 0.06341552734375, 0.0693206787109375, 0.075225830078125, 0.0811309814453125, 0.0870361328125, 0.0929412841796875, 0.098846435546875, 0.1047515869140625, 0.11065673828125, 0.1165618896484375, 0.122467041015625, 0.1283721923828125, 0.13427734375, 0.1401824951171875, 0.146087646484375, 0.1519927978515625, 0.15789794921875, 0.1638031005859375, 0.169708251953125, 0.1756134033203125, 0.1815185546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 8.0, 10.0, 17.0, 16.0, 25.0, 38.0, 51.0, 44.0, 47.0, 72.0, 71.0, 65.0, 72.0, 78.0, 70.0, 60.0, 55.0, 50.0, 28.0, 34.0, 25.0, 17.0, 16.0, 11.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045806884765625, -0.0442500114440918, -0.042693138122558594, -0.04113626480102539, -0.03957939147949219, -0.038022518157958984, -0.03646564483642578, -0.03490877151489258, -0.033351898193359375, -0.03179502487182617, -0.03023815155029297, -0.028681278228759766, -0.027124404907226562, -0.02556753158569336, -0.024010658264160156, -0.022453784942626953, -0.02089691162109375, -0.019340038299560547, -0.017783164978027344, -0.01622629165649414, -0.014669418334960938, -0.013112545013427734, -0.011555671691894531, -0.009998798370361328, -0.008441925048828125, -0.006885051727294922, -0.005328178405761719, -0.0037713050842285156, -0.0022144317626953125, -0.0006575584411621094, 0.0008993148803710938, 0.002456188201904297, 0.0040130615234375, 0.005569934844970703, 0.007126808166503906, 0.00868368148803711, 0.010240554809570312, 0.011797428131103516, 0.013354301452636719, 0.014911174774169922, 0.016468048095703125, 0.018024921417236328, 0.01958179473876953, 0.021138668060302734, 0.022695541381835938, 0.02425241470336914, 0.025809288024902344, 0.027366161346435547, 0.02892303466796875, 0.030479907989501953, 0.032036781311035156, 0.03359365463256836, 0.03515052795410156, 0.036707401275634766, 0.03826427459716797, 0.03982114791870117, 0.041378021240234375, 0.04293489456176758, 0.04449176788330078, 0.046048641204833984, 0.04760551452636719, 0.04916238784790039, 0.050719261169433594, 0.0522761344909668, 0.0538330078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 6.0, 6.0, 5.0, 8.0, 15.0, 20.0, 26.0, 28.0, 45.0, 57.0, 79.0, 107.0, 164.0, 226.0, 371.0, 553.0, 1028.0, 2020.0, 5173.0, 16474.0, 59668.0, 366292.0, 496195.0, 69648.0, 19203.0, 5942.0, 2280.0, 1055.0, 592.0, 369.0, 240.0, 177.0, 145.0, 78.0, 65.0, 59.0, 38.0, 22.0, 20.0, 23.0, 8.0, 11.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2120361328125, -0.20520973205566406, -0.19838333129882812, -0.1915569305419922, -0.18473052978515625, -0.1779041290283203, -0.17107772827148438, -0.16425132751464844, -0.1574249267578125, -0.15059852600097656, -0.14377212524414062, -0.1369457244873047, -0.13011932373046875, -0.12329292297363281, -0.11646652221679688, -0.10964012145996094, -0.102813720703125, -0.09598731994628906, -0.08916091918945312, -0.08233451843261719, -0.07550811767578125, -0.06868171691894531, -0.061855316162109375, -0.05502891540527344, -0.0482025146484375, -0.04137611389160156, -0.034549713134765625, -0.027723312377929688, -0.02089691162109375, -0.014070510864257812, -0.007244110107421875, -0.0004177093505859375, 0.00640869140625, 0.013235092163085938, 0.020061492919921875, 0.026887893676757812, 0.03371429443359375, 0.04054069519042969, 0.047367095947265625, 0.05419349670410156, 0.0610198974609375, 0.06784629821777344, 0.07467269897460938, 0.08149909973144531, 0.08832550048828125, 0.09515190124511719, 0.10197830200195312, 0.10880470275878906, 0.115631103515625, 0.12245750427246094, 0.12928390502929688, 0.1361103057861328, 0.14293670654296875, 0.1497631072998047, 0.15658950805664062, 0.16341590881347656, 0.1702423095703125, 0.17706871032714844, 0.18389511108398438, 0.1907215118408203, 0.19754791259765625, 0.2043743133544922, 0.21120071411132812, 0.21802711486816406, 0.224853515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 5.0, 7.0, 6.0, 14.0, 20.0, 32.0, 31.0, 31.0, 42.0, 32.0, 50.0, 49.0, 51.0, 56.0, 49.0, 60.0, 45.0, 64.0, 46.0, 54.0, 44.0, 32.0, 28.0, 33.0, 20.0, 25.0, 11.0, 12.0, 10.0, 10.0, 8.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17360305786132812, -0.16825103759765625, -0.16289901733398438, -0.1575469970703125, -0.15219497680664062, -0.14684295654296875, -0.14149093627929688, -0.136138916015625, -0.13078689575195312, -0.12543487548828125, -0.12008285522460938, -0.1147308349609375, -0.10937881469726562, -0.10402679443359375, -0.09867477416992188, -0.09332275390625, -0.08797073364257812, -0.08261871337890625, -0.07726669311523438, -0.0719146728515625, -0.06656265258789062, -0.06121063232421875, -0.055858612060546875, -0.050506591796875, -0.045154571533203125, -0.03980255126953125, -0.034450531005859375, -0.0290985107421875, -0.023746490478515625, -0.01839447021484375, -0.013042449951171875, -0.0076904296875, -0.002338409423828125, 0.00301361083984375, 0.008365631103515625, 0.0137176513671875, 0.019069671630859375, 0.02442169189453125, 0.029773712158203125, 0.035125732421875, 0.040477752685546875, 0.04582977294921875, 0.051181793212890625, 0.0565338134765625, 0.061885833740234375, 0.06723785400390625, 0.07258987426757812, 0.07794189453125, 0.08329391479492188, 0.08864593505859375, 0.09399795532226562, 0.0993499755859375, 0.10470199584960938, 0.11005401611328125, 0.11540603637695312, 0.120758056640625, 0.12611007690429688, 0.13146209716796875, 0.13681411743164062, 0.1421661376953125, 0.14751815795898438, 0.15287017822265625, 0.15822219848632812, 0.16357421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 12.0, 17.0, 30.0, 47.0, 63.0, 95.0, 169.0, 361.0, 803.0, 1894.0, 5187.0, 16760.0, 69768.0, 765689.0, 146754.0, 27920.0, 8096.0, 2778.0, 1092.0, 454.0, 241.0, 134.0, 72.0, 39.0, 29.0, 15.0, 12.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2314453125, -0.22589397430419922, -0.22034263610839844, -0.21479129791259766, -0.20923995971679688, -0.2036886215209961, -0.1981372833251953, -0.19258594512939453, -0.18703460693359375, -0.18148326873779297, -0.1759319305419922, -0.1703805923461914, -0.16482925415039062, -0.15927791595458984, -0.15372657775878906, -0.14817523956298828, -0.1426239013671875, -0.13707256317138672, -0.13152122497558594, -0.12596988677978516, -0.12041854858398438, -0.1148672103881836, -0.10931587219238281, -0.10376453399658203, -0.09821319580078125, -0.09266185760498047, -0.08711051940917969, -0.0815591812133789, -0.07600784301757812, -0.07045650482177734, -0.06490516662597656, -0.05935382843017578, -0.053802490234375, -0.04825115203857422, -0.04269981384277344, -0.037148475646972656, -0.031597137451171875, -0.026045799255371094, -0.020494461059570312, -0.014943122863769531, -0.00939178466796875, -0.0038404464721679688, 0.0017108917236328125, 0.007262229919433594, 0.012813568115234375, 0.018364906311035156, 0.023916244506835938, 0.02946758270263672, 0.0350189208984375, 0.04057025909423828, 0.04612159729003906, 0.051672935485839844, 0.057224273681640625, 0.0627756118774414, 0.06832695007324219, 0.07387828826904297, 0.07942962646484375, 0.08498096466064453, 0.09053230285644531, 0.0960836410522461, 0.10163497924804688, 0.10718631744384766, 0.11273765563964844, 0.11828899383544922, 0.12384033203125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 13.0, 10.0, 11.0, 35.0, 61.0, 98.0, 124.0, 173.0, 165.0, 124.0, 64.0, 43.0, 20.0, 20.0, 9.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002090930938720703, -0.000202864408493042, -0.00019663572311401367, -0.00019040703773498535, -0.00018417835235595703, -0.0001779496669769287, -0.0001717209815979004, -0.00016549229621887207, -0.00015926361083984375, -0.00015303492546081543, -0.0001468062400817871, -0.0001405775547027588, -0.00013434886932373047, -0.00012812018394470215, -0.00012189149856567383, -0.00011566281318664551, -0.00010943412780761719, -0.00010320544242858887, -9.697675704956055e-05, -9.074807167053223e-05, -8.45193862915039e-05, -7.829070091247559e-05, -7.206201553344727e-05, -6.583333015441895e-05, -5.9604644775390625e-05, -5.3375959396362305e-05, -4.7147274017333984e-05, -4.0918588638305664e-05, -3.4689903259277344e-05, -2.8461217880249023e-05, -2.2232532501220703e-05, -1.6003847122192383e-05, -9.775161743164062e-06, -3.546476364135742e-06, 2.682209014892578e-06, 8.910894393920898e-06, 1.5139579772949219e-05, 2.136826515197754e-05, 2.759695053100586e-05, 3.382563591003418e-05, 4.00543212890625e-05, 4.628300666809082e-05, 5.251169204711914e-05, 5.874037742614746e-05, 6.496906280517578e-05, 7.11977481842041e-05, 7.742643356323242e-05, 8.365511894226074e-05, 8.988380432128906e-05, 9.611248970031738e-05, 0.0001023411750793457, 0.00010856986045837402, 0.00011479854583740234, 0.00012102723121643066, 0.00012725591659545898, 0.0001334846019744873, 0.00013971328735351562, 0.00014594197273254395, 0.00015217065811157227, 0.00015839934349060059, 0.0001646280288696289, 0.00017085671424865723, 0.00017708539962768555, 0.00018331408500671387, 0.0001895427703857422]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 12.0, 18.0, 26.0, 35.0, 43.0, 75.0, 95.0, 174.0, 268.0, 492.0, 1030.0, 2726.0, 8729.0, 36977.0, 381072.0, 557356.0, 43695.0, 10181.0, 3041.0, 1158.0, 546.0, 274.0, 160.0, 92.0, 62.0, 45.0, 35.0, 24.0, 23.0, 15.0, 14.0, 12.0, 7.0, 5.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17215919494628906, -0.16695022583007812, -0.1617412567138672, -0.15653228759765625, -0.1513233184814453, -0.14611434936523438, -0.14090538024902344, -0.1356964111328125, -0.13048744201660156, -0.12527847290039062, -0.12006950378417969, -0.11486053466796875, -0.10965156555175781, -0.10444259643554688, -0.09923362731933594, -0.094024658203125, -0.08881568908691406, -0.08360671997070312, -0.07839775085449219, -0.07318878173828125, -0.06797981262207031, -0.06277084350585938, -0.05756187438964844, -0.0523529052734375, -0.04714393615722656, -0.041934967041015625, -0.03672599792480469, -0.03151702880859375, -0.026308059692382812, -0.021099090576171875, -0.015890121459960938, -0.01068115234375, -0.0054721832275390625, -0.000263214111328125, 0.0049457550048828125, 0.01015472412109375, 0.015363693237304688, 0.020572662353515625, 0.025781631469726562, 0.0309906005859375, 0.03619956970214844, 0.041408538818359375, 0.04661750793457031, 0.05182647705078125, 0.05703544616699219, 0.062244415283203125, 0.06745338439941406, 0.072662353515625, 0.07787132263183594, 0.08308029174804688, 0.08828926086425781, 0.09349822998046875, 0.09870719909667969, 0.10391616821289062, 0.10912513732910156, 0.1143341064453125, 0.11954307556152344, 0.12475204467773438, 0.1299610137939453, 0.13516998291015625, 0.1403789520263672, 0.14558792114257812, 0.15079689025878906, 0.156005859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 8.0, 4.0, 5.0, 6.0, 4.0, 7.0, 15.0, 15.0, 23.0, 51.0, 63.0, 161.0, 239.0, 183.0, 69.0, 41.0, 20.0, 23.0, 13.0, 10.0, 12.0, 7.0, 4.0, 4.0, 8.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.1118783950805664, -0.10809516906738281, -0.10431194305419922, -0.10052871704101562, -0.09674549102783203, -0.09296226501464844, -0.08917903900146484, -0.08539581298828125, -0.08161258697509766, -0.07782936096191406, -0.07404613494873047, -0.07026290893554688, -0.06647968292236328, -0.06269645690917969, -0.058913230895996094, -0.0551300048828125, -0.051346778869628906, -0.04756355285644531, -0.04378032684326172, -0.039997100830078125, -0.03621387481689453, -0.03243064880371094, -0.028647422790527344, -0.02486419677734375, -0.021080970764160156, -0.017297744750976562, -0.013514518737792969, -0.009731292724609375, -0.005948066711425781, -0.0021648406982421875, 0.0016183853149414062, 0.005401611328125, 0.009184837341308594, 0.012968063354492188, 0.01675128936767578, 0.020534515380859375, 0.02431774139404297, 0.028100967407226562, 0.031884193420410156, 0.03566741943359375, 0.039450645446777344, 0.04323387145996094, 0.04701709747314453, 0.050800323486328125, 0.05458354949951172, 0.05836677551269531, 0.062150001525878906, 0.0659332275390625, 0.0697164535522461, 0.07349967956542969, 0.07728290557861328, 0.08106613159179688, 0.08484935760498047, 0.08863258361816406, 0.09241580963134766, 0.09619903564453125, 0.09998226165771484, 0.10376548767089844, 0.10754871368408203, 0.11133193969726562, 0.11511516571044922, 0.11889839172363281, 0.1226816177368164, 0.12646484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 13.0, 32.0, 52.0, 110.0, 168.0, 207.0, 173.0, 120.0, 64.0, 37.0, 16.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2968658208847046, -1.227510929107666, -1.1581560373306274, -1.0888011455535889, -1.0194463729858398, -0.9500914216041565, -0.8807365894317627, -0.8113816976547241, -0.7420268058776855, -0.672671914100647, -0.6033170223236084, -0.5339621901512146, -0.464607298374176, -0.39525240659713745, -0.32589754462242126, -0.2565426826477051, -0.1871877908706665, -0.11783291399478912, -0.04847803711891174, 0.020876839756965637, 0.09023171663284302, 0.1595866084098816, 0.22894147038459778, 0.29829633235931396, 0.36765122413635254, 0.4370061159133911, 0.5063610076904297, 0.5757158398628235, 0.6450707316398621, 0.7144256234169006, 0.7837804555892944, 0.853135347366333, 0.9224903583526611, 0.9918452501296997, 1.0612001419067383, 1.1305550336837769, 1.1999099254608154, 1.2692646980285645, 1.338619589805603, 1.4079744815826416, 1.4773293733596802, 1.5466842651367188, 1.6160391569137573, 1.685394048690796, 1.754748821258545, 1.824103832244873, 1.893458604812622, 1.9628134965896606, 2.032168388366699, 2.1015231609344482, 2.1708781719207764, 2.2402329444885254, 2.3095879554748535, 2.3789427280426025, 2.4482977390289307, 2.5176525115966797, 2.587007522583008, 2.656362295150757, 2.725717306137085, 2.795072078704834, 2.864427089691162, 2.933781862258911, 3.0031368732452393, 3.0724916458129883, 3.1418464183807373]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 8.0, 6.0, 9.0, 13.0, 13.0, 12.0, 11.0, 7.0, 18.0, 20.0, 17.0, 23.0, 30.0, 33.0, 35.0, 35.0, 41.0, 35.0, 29.0, 35.0, 32.0, 39.0, 45.0, 50.0, 28.0, 42.0, 34.0, 32.0, 35.0, 26.0, 14.0, 28.0, 18.0, 16.0, 23.0, 14.0, 15.0, 13.0, 11.0, 12.0, 12.0, 3.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6337169408798218, -0.613333523273468, -0.592950165271759, -0.5725667476654053, -0.5521833896636963, -0.5317999720573425, -0.5114165544509888, -0.4910331666469574, -0.470649778842926, -0.45026639103889465, -0.4298830032348633, -0.4094995856285095, -0.38911619782447815, -0.3687328100204468, -0.348349392414093, -0.32796600461006165, -0.3075826168060303, -0.2871992290019989, -0.26681584119796753, -0.24643242359161377, -0.2260490357875824, -0.20566564798355103, -0.18528224527835846, -0.1648988425731659, -0.14451545476913452, -0.12413205951452255, -0.10374866425991058, -0.08336526900529861, -0.06298187375068665, -0.042598478496074677, -0.022215083241462708, -0.0018316805362701416, 0.018551647663116455, 0.038935042917728424, 0.05931843817234039, 0.07970183342695236, 0.10008522868156433, 0.1204686239361763, 0.14085201919078827, 0.16123542189598083, 0.1816188097000122, 0.20200219750404358, 0.22238560020923615, 0.2427690029144287, 0.2631523907184601, 0.28353577852249146, 0.3039191961288452, 0.3243025839328766, 0.34468597173690796, 0.36506935954093933, 0.3854527473449707, 0.40583616495132446, 0.42621955275535583, 0.4466029405593872, 0.46698635816574097, 0.48736974596977234, 0.5077531337738037, 0.5281365513801575, 0.5485199093818665, 0.5689033269882202, 0.5892866849899292, 0.609670102596283, 0.6300535202026367, 0.6504368782043457, 0.6708202958106995]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 3.0, 11.0, 22.0, 29.0, 26.0, 57.0, 108.0, 172.0, 285.0, 495.0, 972.0, 1772.0, 3513.0, 7853.0, 18569.0, 49749.0, 182878.0, 3003684.0, 753231.0, 109783.0, 34524.0, 13873.0, 6129.0, 2840.0, 1570.0, 856.0, 463.0, 293.0, 154.0, 132.0, 75.0, 55.0, 36.0, 22.0, 15.0, 14.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14098358154296875, -0.1360931396484375, -0.13120269775390625, -0.126312255859375, -0.12142181396484375, -0.1165313720703125, -0.11164093017578125, -0.10675048828125, -0.10186004638671875, -0.0969696044921875, -0.09207916259765625, -0.087188720703125, -0.08229827880859375, -0.0774078369140625, -0.07251739501953125, -0.067626953125, -0.06273651123046875, -0.0578460693359375, -0.05295562744140625, -0.048065185546875, -0.04317474365234375, -0.0382843017578125, -0.03339385986328125, -0.02850341796875, -0.02361297607421875, -0.0187225341796875, -0.01383209228515625, -0.008941650390625, -0.00405120849609375, 0.0008392333984375, 0.00572967529296875, 0.0106201171875, 0.01551055908203125, 0.0204010009765625, 0.02529144287109375, 0.030181884765625, 0.03507232666015625, 0.0399627685546875, 0.04485321044921875, 0.04974365234375, 0.05463409423828125, 0.0595245361328125, 0.06441497802734375, 0.069305419921875, 0.07419586181640625, 0.0790863037109375, 0.08397674560546875, 0.0888671875, 0.09375762939453125, 0.0986480712890625, 0.10353851318359375, 0.108428955078125, 0.11331939697265625, 0.1182098388671875, 0.12310028076171875, 0.12799072265625, 0.13288116455078125, 0.1377716064453125, 0.14266204833984375, 0.147552490234375, 0.15244293212890625, 0.1573333740234375, 0.16222381591796875, 0.1671142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 6.0, 11.0, 11.0, 16.0, 22.0, 19.0, 28.0, 35.0, 45.0, 53.0, 62.0, 52.0, 70.0, 62.0, 78.0, 63.0, 66.0, 58.0, 49.0, 46.0, 32.0, 25.0, 23.0, 13.0, 13.0, 12.0, 13.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04876708984375, -0.04724264144897461, -0.04571819305419922, -0.04419374465942383, -0.04266929626464844, -0.04114484786987305, -0.039620399475097656, -0.038095951080322266, -0.036571502685546875, -0.035047054290771484, -0.033522605895996094, -0.0319981575012207, -0.030473709106445312, -0.028949260711669922, -0.02742481231689453, -0.02590036392211914, -0.02437591552734375, -0.02285146713256836, -0.02132701873779297, -0.019802570343017578, -0.018278121948242188, -0.016753673553466797, -0.015229225158691406, -0.013704776763916016, -0.012180328369140625, -0.010655879974365234, -0.009131431579589844, -0.007606983184814453, -0.0060825347900390625, -0.004558086395263672, -0.0030336380004882812, -0.0015091896057128906, 1.52587890625e-05, 0.0015397071838378906, 0.0030641555786132812, 0.004588603973388672, 0.0061130523681640625, 0.007637500762939453, 0.009161949157714844, 0.010686397552490234, 0.012210845947265625, 0.013735294342041016, 0.015259742736816406, 0.016784191131591797, 0.018308639526367188, 0.019833087921142578, 0.02135753631591797, 0.02288198471069336, 0.02440643310546875, 0.02593088150024414, 0.02745532989501953, 0.028979778289794922, 0.030504226684570312, 0.0320286750793457, 0.033553123474121094, 0.035077571868896484, 0.036602020263671875, 0.038126468658447266, 0.039650917053222656, 0.04117536544799805, 0.04269981384277344, 0.04422426223754883, 0.04574871063232422, 0.04727315902709961, 0.048797607421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 11.0, 6.0, 9.0, 14.0, 18.0, 22.0, 32.0, 44.0, 76.0, 104.0, 169.0, 226.0, 373.0, 641.0, 1013.0, 1905.0, 3397.0, 7079.0, 15147.0, 35458.0, 98032.0, 412957.0, 2965374.0, 473701.0, 107494.0, 38430.0, 16246.0, 7703.0, 3778.0, 1964.0, 1099.0, 649.0, 395.0, 268.0, 163.0, 97.0, 56.0, 44.0, 26.0, 19.0, 7.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13008499145507812, -0.12552642822265625, -0.12096786499023438, -0.1164093017578125, -0.11185073852539062, -0.10729217529296875, -0.10273361206054688, -0.098175048828125, -0.09361648559570312, -0.08905792236328125, -0.08449935913085938, -0.0799407958984375, -0.07538223266601562, -0.07082366943359375, -0.06626510620117188, -0.06170654296875, -0.057147979736328125, -0.05258941650390625, -0.048030853271484375, -0.0434722900390625, -0.038913726806640625, -0.03435516357421875, -0.029796600341796875, -0.025238037109375, -0.020679473876953125, -0.01612091064453125, -0.011562347412109375, -0.0070037841796875, -0.002445220947265625, 0.00211334228515625, 0.006671905517578125, 0.01123046875, 0.015789031982421875, 0.02034759521484375, 0.024906158447265625, 0.0294647216796875, 0.034023284912109375, 0.03858184814453125, 0.043140411376953125, 0.047698974609375, 0.052257537841796875, 0.05681610107421875, 0.061374664306640625, 0.0659332275390625, 0.07049179077148438, 0.07505035400390625, 0.07960891723632812, 0.08416748046875, 0.08872604370117188, 0.09328460693359375, 0.09784317016601562, 0.1024017333984375, 0.10696029663085938, 0.11151885986328125, 0.11607742309570312, 0.120635986328125, 0.12519454956054688, 0.12975311279296875, 0.13431167602539062, 0.1388702392578125, 0.14342880249023438, 0.14798736572265625, 0.15254592895507812, 0.1571044921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 3.0, 12.0, 5.0, 13.0, 22.0, 23.0, 42.0, 53.0, 66.0, 97.0, 155.0, 276.0, 560.0, 1342.0, 584.0, 277.0, 165.0, 98.0, 71.0, 47.0, 34.0, 22.0, 22.0, 14.0, 15.0, 14.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06536865234375, -0.06307601928710938, -0.06078338623046875, -0.058490753173828125, -0.0561981201171875, -0.053905487060546875, -0.05161285400390625, -0.049320220947265625, -0.047027587890625, -0.044734954833984375, -0.04244232177734375, -0.040149688720703125, -0.0378570556640625, -0.035564422607421875, -0.03327178955078125, -0.030979156494140625, -0.0286865234375, -0.026393890380859375, -0.02410125732421875, -0.021808624267578125, -0.0195159912109375, -0.017223358154296875, -0.01493072509765625, -0.012638092041015625, -0.010345458984375, -0.008052825927734375, -0.00576019287109375, -0.003467559814453125, -0.0011749267578125, 0.001117706298828125, 0.00341033935546875, 0.005702972412109375, 0.00799560546875, 0.010288238525390625, 0.01258087158203125, 0.014873504638671875, 0.0171661376953125, 0.019458770751953125, 0.02175140380859375, 0.024044036865234375, 0.026336669921875, 0.028629302978515625, 0.03092193603515625, 0.033214569091796875, 0.0355072021484375, 0.037799835205078125, 0.04009246826171875, 0.042385101318359375, 0.044677734375, 0.046970367431640625, 0.04926300048828125, 0.051555633544921875, 0.0538482666015625, 0.056140899658203125, 0.05843353271484375, 0.060726165771484375, 0.063018798828125, 0.06531143188476562, 0.06760406494140625, 0.06989669799804688, 0.0721893310546875, 0.07448196411132812, 0.07677459716796875, 0.07906723022460938, 0.08135986328125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 8.0, 15.0, 37.0, 97.0, 212.0, 238.0, 213.0, 110.0, 47.0, 18.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.186853289604187, -1.1517101526260376, -1.1165670156478882, -1.0814238786697388, -1.0462807416915894, -1.01113760471344, -0.9759945273399353, -0.9408513903617859, -0.9057082533836365, -0.8705651164054871, -0.8354219794273376, -0.8002788424491882, -0.7651357650756836, -0.7299926280975342, -0.6948494911193848, -0.6597063541412354, -0.6245632171630859, -0.5894200801849365, -0.5542769432067871, -0.5191338062286377, -0.48399069905281067, -0.44884756207466125, -0.41370445489883423, -0.3785613179206848, -0.3434181809425354, -0.308275043964386, -0.2731319069862366, -0.23798879981040955, -0.20284566283226013, -0.16770252585411072, -0.1325594037771225, -0.09741628170013428, -0.06227302551269531, -0.027129895985126495, 0.008013233542442322, 0.04315636307001114, 0.07829949259757996, 0.11344262957572937, 0.1485857516527176, 0.1837288737297058, 0.21887201070785522, 0.25401514768600464, 0.28915828466415405, 0.3243013918399811, 0.3594445288181305, 0.3945876657962799, 0.42973077297210693, 0.46487390995025635, 0.5000170469284058, 0.5351601839065552, 0.5703033208847046, 0.605446457862854, 0.6405895948410034, 0.6757327318191528, 0.7108758091926575, 0.7460189461708069, 0.7811620831489563, 0.8163052201271057, 0.8514483571052551, 0.8865914940834045, 0.9217345714569092, 0.9568777084350586, 0.992020845413208, 1.0271639823913574, 1.0623071193695068]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 13.0, 12.0, 22.0, 14.0, 14.0, 26.0, 25.0, 22.0, 20.0, 40.0, 31.0, 29.0, 42.0, 51.0, 37.0, 38.0, 25.0, 39.0, 33.0, 35.0, 33.0, 37.0, 31.0, 23.0, 25.0, 32.0, 30.0, 20.0, 28.0, 22.0, 19.0, 16.0, 16.0, 17.0, 2.0, 14.0, 9.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.22011446952819824, -0.21283075213432312, -0.205547034740448, -0.19826331734657288, -0.19097959995269775, -0.18369588255882263, -0.1764121651649475, -0.1691284477710724, -0.16184473037719727, -0.15456101298332214, -0.14727729558944702, -0.1399935781955719, -0.13270986080169678, -0.12542614340782166, -0.11814243346452713, -0.11085871607065201, -0.10357500612735748, -0.09629128873348236, -0.08900757133960724, -0.08172385394573212, -0.074440136551857, -0.06715641915798187, -0.05987270921468735, -0.052588991820812225, -0.0453052744269371, -0.03802155703306198, -0.03073784150183201, -0.023454125970602036, -0.016170408576726913, -0.008886691182851791, -0.0016029775142669678, 0.005680739879608154, 0.012964457273483276, 0.0202481746673584, 0.02753189019858837, 0.034815605729818344, 0.042099323123693466, 0.04938304051756859, 0.05666675418615341, 0.06395047158002853, 0.07123418897390366, 0.07851790636777878, 0.0858016237616539, 0.09308533370494843, 0.10036905109882355, 0.10765276849269867, 0.11493648588657379, 0.12222020328044891, 0.12950392067432404, 0.13678763806819916, 0.14407135546207428, 0.1513550728559494, 0.15863879024982452, 0.16592250764369965, 0.17320621013641357, 0.1804899275302887, 0.18777364492416382, 0.19505736231803894, 0.20234107971191406, 0.20962479710578918, 0.2169085144996643, 0.22419223189353943, 0.23147594928741455, 0.23875966668128967, 0.2460433840751648]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 21.0, 30.0, 32.0, 59.0, 96.0, 142.0, 265.0, 493.0, 993.0, 2166.0, 4796.0, 10639.0, 23124.0, 50998.0, 209346.0, 555652.0, 117588.0, 38564.0, 18054.0, 8251.0, 3744.0, 1736.0, 810.0, 400.0, 196.0, 141.0, 65.0, 34.0, 30.0, 18.0, 22.0, 9.0, 5.0, 5.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1737060546875, -0.1690540313720703, -0.16440200805664062, -0.15974998474121094, -0.15509796142578125, -0.15044593811035156, -0.14579391479492188, -0.1411418914794922, -0.1364898681640625, -0.1318378448486328, -0.12718582153320312, -0.12253379821777344, -0.11788177490234375, -0.11322975158691406, -0.10857772827148438, -0.10392570495605469, -0.099273681640625, -0.09462165832519531, -0.08996963500976562, -0.08531761169433594, -0.08066558837890625, -0.07601356506347656, -0.07136154174804688, -0.06670951843261719, -0.0620574951171875, -0.05740547180175781, -0.052753448486328125, -0.04810142517089844, -0.04344940185546875, -0.03879737854003906, -0.034145355224609375, -0.029493331909179688, -0.02484130859375, -0.020189285278320312, -0.015537261962890625, -0.010885238647460938, -0.00623321533203125, -0.0015811920166015625, 0.003070831298828125, 0.0077228546142578125, 0.0123748779296875, 0.017026901245117188, 0.021678924560546875, 0.026330947875976562, 0.03098297119140625, 0.03563499450683594, 0.040287017822265625, 0.04493904113769531, 0.049591064453125, 0.05424308776855469, 0.058895111083984375, 0.06354713439941406, 0.06819915771484375, 0.07285118103027344, 0.07750320434570312, 0.08215522766113281, 0.0868072509765625, 0.09145927429199219, 0.09611129760742188, 0.10076332092285156, 0.10541534423828125, 0.11006736755371094, 0.11471939086914062, 0.11937141418457031, 0.1240234375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 5.0, 10.0, 10.0, 25.0, 29.0, 34.0, 28.0, 43.0, 49.0, 57.0, 52.0, 73.0, 49.0, 63.0, 51.0, 55.0, 55.0, 50.0, 39.0, 47.0, 42.0, 27.0, 20.0, 16.0, 9.0, 20.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050140380859375, -0.04868936538696289, -0.04723834991455078, -0.04578733444213867, -0.04433631896972656, -0.04288530349731445, -0.041434288024902344, -0.039983272552490234, -0.038532257080078125, -0.037081241607666016, -0.035630226135253906, -0.0341792106628418, -0.03272819519042969, -0.03127717971801758, -0.02982616424560547, -0.02837514877319336, -0.02692413330078125, -0.02547311782836914, -0.02402210235595703, -0.022571086883544922, -0.021120071411132812, -0.019669055938720703, -0.018218040466308594, -0.016767024993896484, -0.015316009521484375, -0.013864994049072266, -0.012413978576660156, -0.010962963104248047, -0.009511947631835938, -0.008060932159423828, -0.006609916687011719, -0.005158901214599609, -0.0037078857421875, -0.0022568702697753906, -0.0008058547973632812, 0.0006451606750488281, 0.0020961761474609375, 0.003547191619873047, 0.004998207092285156, 0.006449222564697266, 0.007900238037109375, 0.009351253509521484, 0.010802268981933594, 0.012253284454345703, 0.013704299926757812, 0.015155315399169922, 0.01660633087158203, 0.01805734634399414, 0.01950836181640625, 0.02095937728881836, 0.02241039276123047, 0.023861408233642578, 0.025312423706054688, 0.026763439178466797, 0.028214454650878906, 0.029665470123291016, 0.031116485595703125, 0.032567501068115234, 0.034018516540527344, 0.03546953201293945, 0.03692054748535156, 0.03837156295776367, 0.03982257843017578, 0.04127359390258789, 0.042724609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 9.0, 7.0, 10.0, 15.0, 24.0, 33.0, 25.0, 38.0, 71.0, 98.0, 149.0, 253.0, 418.0, 804.0, 1689.0, 3916.0, 9263.0, 22523.0, 53123.0, 368232.0, 486036.0, 58696.0, 24552.0, 10353.0, 4213.0, 1874.0, 863.0, 481.0, 265.0, 149.0, 93.0, 80.0, 44.0, 37.0, 33.0, 21.0, 15.0, 12.0, 9.0, 6.0, 5.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.191162109375, -0.1855487823486328, -0.17993545532226562, -0.17432212829589844, -0.16870880126953125, -0.16309547424316406, -0.15748214721679688, -0.1518688201904297, -0.1462554931640625, -0.1406421661376953, -0.13502883911132812, -0.12941551208496094, -0.12380218505859375, -0.11818885803222656, -0.11257553100585938, -0.10696220397949219, -0.101348876953125, -0.09573554992675781, -0.09012222290039062, -0.08450889587402344, -0.07889556884765625, -0.07328224182128906, -0.06766891479492188, -0.06205558776855469, -0.0564422607421875, -0.05082893371582031, -0.045215606689453125, -0.03960227966308594, -0.03398895263671875, -0.028375625610351562, -0.022762298583984375, -0.017148971557617188, -0.01153564453125, -0.0059223175048828125, -0.000308990478515625, 0.0053043365478515625, 0.01091766357421875, 0.016530990600585938, 0.022144317626953125, 0.027757644653320312, 0.0333709716796875, 0.03898429870605469, 0.044597625732421875, 0.05021095275878906, 0.05582427978515625, 0.06143760681152344, 0.06705093383789062, 0.07266426086425781, 0.078277587890625, 0.08389091491699219, 0.08950424194335938, 0.09511756896972656, 0.10073089599609375, 0.10634422302246094, 0.11195755004882812, 0.11757087707519531, 0.1231842041015625, 0.1287975311279297, 0.13441085815429688, 0.14002418518066406, 0.14563751220703125, 0.15125083923339844, 0.15686416625976562, 0.1624774932861328, 0.1680908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 5.0, 4.0, 12.0, 15.0, 8.0, 10.0, 18.0, 20.0, 26.0, 33.0, 33.0, 47.0, 48.0, 40.0, 49.0, 42.0, 67.0, 56.0, 66.0, 58.0, 59.0, 44.0, 39.0, 37.0, 24.0, 23.0, 32.0, 17.0, 9.0, 10.0, 12.0, 10.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181396484375, -0.17522239685058594, -0.16904830932617188, -0.1628742218017578, -0.15670013427734375, -0.1505260467529297, -0.14435195922851562, -0.13817787170410156, -0.1320037841796875, -0.12582969665527344, -0.11965560913085938, -0.11348152160644531, -0.10730743408203125, -0.10113334655761719, -0.09495925903320312, -0.08878517150878906, -0.082611083984375, -0.07643699645996094, -0.07026290893554688, -0.06408882141113281, -0.05791473388671875, -0.05174064636230469, -0.045566558837890625, -0.03939247131347656, -0.0332183837890625, -0.027044296264648438, -0.020870208740234375, -0.014696121215820312, -0.00852203369140625, -0.0023479461669921875, 0.003826141357421875, 0.010000228881835938, 0.01617431640625, 0.022348403930664062, 0.028522491455078125, 0.03469657897949219, 0.04087066650390625, 0.04704475402832031, 0.053218841552734375, 0.05939292907714844, 0.0655670166015625, 0.07174110412597656, 0.07791519165039062, 0.08408927917480469, 0.09026336669921875, 0.09643745422363281, 0.10261154174804688, 0.10878562927246094, 0.114959716796875, 0.12113380432128906, 0.12730789184570312, 0.1334819793701172, 0.13965606689453125, 0.1458301544189453, 0.15200424194335938, 0.15817832946777344, 0.1643524169921875, 0.17052650451660156, 0.17670059204101562, 0.1828746795654297, 0.18904876708984375, 0.1952228546142578, 0.20139694213867188, 0.20757102966308594, 0.2137451171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 6.0, 4.0, 9.0, 7.0, 16.0, 17.0, 25.0, 41.0, 65.0, 90.0, 127.0, 236.0, 373.0, 679.0, 1327.0, 2921.0, 6301.0, 15024.0, 38731.0, 181980.0, 694308.0, 64904.0, 23644.0, 9472.0, 4108.0, 1890.0, 907.0, 505.0, 327.0, 177.0, 116.0, 63.0, 45.0, 24.0, 28.0, 21.0, 7.0, 7.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.10955810546875, -0.10581111907958984, -0.10206413269042969, -0.09831714630126953, -0.09457015991210938, -0.09082317352294922, -0.08707618713378906, -0.0833292007446289, -0.07958221435546875, -0.0758352279663086, -0.07208824157714844, -0.06834125518798828, -0.06459426879882812, -0.06084728240966797, -0.05710029602050781, -0.053353309631347656, -0.0496063232421875, -0.045859336853027344, -0.04211235046386719, -0.03836536407470703, -0.034618377685546875, -0.03087139129638672, -0.027124404907226562, -0.023377418518066406, -0.01963043212890625, -0.015883445739746094, -0.012136459350585938, -0.008389472961425781, -0.004642486572265625, -0.0008955001831054688, 0.0028514862060546875, 0.006598472595214844, 0.010345458984375, 0.014092445373535156, 0.017839431762695312, 0.02158641815185547, 0.025333404541015625, 0.02908039093017578, 0.03282737731933594, 0.036574363708496094, 0.04032135009765625, 0.044068336486816406, 0.04781532287597656, 0.05156230926513672, 0.055309295654296875, 0.05905628204345703, 0.06280326843261719, 0.06655025482177734, 0.0702972412109375, 0.07404422760009766, 0.07779121398925781, 0.08153820037841797, 0.08528518676757812, 0.08903217315673828, 0.09277915954589844, 0.0965261459350586, 0.10027313232421875, 0.1040201187133789, 0.10776710510253906, 0.11151409149169922, 0.11526107788085938, 0.11900806427001953, 0.12275505065917969, 0.12650203704833984, 0.1302490234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 8.0, 19.0, 35.0, 34.0, 46.0, 59.0, 62.0, 75.0, 85.0, 110.0, 82.0, 86.0, 67.0, 56.0, 46.0, 27.0, 23.0, 16.0, 11.0, 4.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.903575897216797e-05, -7.579661905765533e-05, -7.25574791431427e-05, -6.931833922863007e-05, -6.607919931411743e-05, -6.28400593996048e-05, -5.960091948509216e-05, -5.636177957057953e-05, -5.3122639656066895e-05, -4.988349974155426e-05, -4.6644359827041626e-05, -4.340521991252899e-05, -4.016607999801636e-05, -3.692694008350372e-05, -3.368780016899109e-05, -3.0448660254478455e-05, -2.720952033996582e-05, -2.3970380425453186e-05, -2.0731240510940552e-05, -1.7492100596427917e-05, -1.4252960681915283e-05, -1.1013820767402649e-05, -7.774680852890015e-06, -4.53554093837738e-06, -1.296401023864746e-06, 1.942738890647888e-06, 5.1818788051605225e-06, 8.421018719673157e-06, 1.1660158634185791e-05, 1.4899298548698425e-05, 1.813843846321106e-05, 2.1377578377723694e-05, 2.4616718292236328e-05, 2.7855858206748962e-05, 3.10949981212616e-05, 3.433413803577423e-05, 3.7573277950286865e-05, 4.08124178647995e-05, 4.4051557779312134e-05, 4.729069769382477e-05, 5.05298376083374e-05, 5.376897752285004e-05, 5.700811743736267e-05, 6.0247257351875305e-05, 6.348639726638794e-05, 6.672553718090057e-05, 6.996467709541321e-05, 7.320381700992584e-05, 7.644295692443848e-05, 7.968209683895111e-05, 8.292123675346375e-05, 8.616037666797638e-05, 8.939951658248901e-05, 9.263865649700165e-05, 9.587779641151428e-05, 9.911693632602692e-05, 0.00010235607624053955, 0.00010559521615505219, 0.00010883435606956482, 0.00011207349598407745, 0.00011531263589859009, 0.00011855177581310272, 0.00012179091572761536, 0.000125030055642128, 0.00012826919555664062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 9.0, 11.0, 19.0, 49.0, 78.0, 138.0, 257.0, 674.0, 1788.0, 6105.0, 25007.0, 193308.0, 761639.0, 45007.0, 10051.0, 2749.0, 875.0, 385.0, 161.0, 95.0, 43.0, 35.0, 15.0, 16.0, 14.0, 6.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.1626129150390625, -0.156402587890625, -0.1501922607421875, -0.14398193359375, -0.1377716064453125, -0.131561279296875, -0.1253509521484375, -0.119140625, -0.1129302978515625, -0.106719970703125, -0.1005096435546875, -0.09429931640625, -0.0880889892578125, -0.081878662109375, -0.0756683349609375, -0.0694580078125, -0.0632476806640625, -0.057037353515625, -0.0508270263671875, -0.04461669921875, -0.0384063720703125, -0.032196044921875, -0.0259857177734375, -0.019775390625, -0.0135650634765625, -0.007354736328125, -0.0011444091796875, 0.00506591796875, 0.0112762451171875, 0.017486572265625, 0.0236968994140625, 0.0299072265625, 0.0361175537109375, 0.042327880859375, 0.0485382080078125, 0.05474853515625, 0.0609588623046875, 0.067169189453125, 0.0733795166015625, 0.07958984375, 0.0858001708984375, 0.092010498046875, 0.0982208251953125, 0.10443115234375, 0.1106414794921875, 0.116851806640625, 0.1230621337890625, 0.1292724609375, 0.1354827880859375, 0.141693115234375, 0.1479034423828125, 0.15411376953125, 0.1603240966796875, 0.166534423828125, 0.1727447509765625, 0.178955078125, 0.1851654052734375, 0.191375732421875, 0.1975860595703125, 0.20379638671875, 0.2100067138671875, 0.216217041015625, 0.2224273681640625, 0.2286376953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 10.0, 10.0, 10.0, 19.0, 20.0, 28.0, 41.0, 95.0, 204.0, 268.0, 116.0, 48.0, 33.0, 22.0, 18.0, 13.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.1200418472290039, -0.11563301086425781, -0.11122417449951172, -0.10681533813476562, -0.10240650177001953, -0.09799766540527344, -0.09358882904052734, -0.08917999267578125, -0.08477115631103516, -0.08036231994628906, -0.07595348358154297, -0.07154464721679688, -0.06713581085205078, -0.06272697448730469, -0.058318138122558594, -0.0539093017578125, -0.049500465393066406, -0.04509162902832031, -0.04068279266357422, -0.036273956298828125, -0.03186511993408203, -0.027456283569335938, -0.023047447204589844, -0.01863861083984375, -0.014229774475097656, -0.009820938110351562, -0.005412101745605469, -0.001003265380859375, 0.0034055709838867188, 0.007814407348632812, 0.012223243713378906, 0.016632080078125, 0.021040916442871094, 0.025449752807617188, 0.02985858917236328, 0.034267425537109375, 0.03867626190185547, 0.04308509826660156, 0.047493934631347656, 0.05190277099609375, 0.056311607360839844, 0.06072044372558594, 0.06512928009033203, 0.06953811645507812, 0.07394695281982422, 0.07835578918457031, 0.0827646255493164, 0.0871734619140625, 0.0915822982788086, 0.09599113464355469, 0.10039997100830078, 0.10480880737304688, 0.10921764373779297, 0.11362648010253906, 0.11803531646728516, 0.12244415283203125, 0.12685298919677734, 0.13126182556152344, 0.13567066192626953, 0.14007949829101562, 0.14448833465576172, 0.1488971710205078, 0.1533060073852539, 0.15771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 16.0, 24.0, 46.0, 68.0, 109.0, 151.0, 162.0, 153.0, 111.0, 72.0, 37.0, 24.0, 19.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6694378852844238, -1.613257646560669, -1.5570772886276245, -1.50089693069458, -1.4447166919708252, -1.3885364532470703, -1.3323560953140259, -1.2761757373809814, -1.2199954986572266, -1.1638152599334717, -1.1076349020004272, -1.0514545440673828, -0.9952743053436279, -0.9390940070152283, -0.8829137086868286, -0.826733410358429, -0.7705531120300293, -0.7143728137016296, -0.65819251537323, -0.6020122170448303, -0.5458319187164307, -0.489651620388031, -0.43347132205963135, -0.3772910237312317, -0.32111072540283203, -0.2649304270744324, -0.20875012874603271, -0.15256983041763306, -0.0963895320892334, -0.04020923376083374, 0.015971064567565918, 0.07215136289596558, 0.12833166122436523, 0.1845119595527649, 0.24069225788116455, 0.2968725562095642, 0.35305285453796387, 0.4092331528663635, 0.4654134511947632, 0.5215937495231628, 0.5777740478515625, 0.6339543461799622, 0.6901346445083618, 0.7463149428367615, 0.8024952411651611, 0.8586755394935608, 0.9148558378219604, 0.9710361361503601, 1.0272164344787598, 1.0833966732025146, 1.139577031135559, 1.1957573890686035, 1.2519376277923584, 1.3081178665161133, 1.3642982244491577, 1.4204785823822021, 1.476658821105957, 1.532839059829712, 1.5890194177627563, 1.6451997756958008, 1.7013800144195557, 1.7575602531433105, 1.813740611076355, 1.8699209690093994, 1.9261012077331543]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 5.0, 6.0, 11.0, 8.0, 12.0, 16.0, 13.0, 14.0, 25.0, 13.0, 30.0, 34.0, 26.0, 42.0, 47.0, 28.0, 48.0, 44.0, 38.0, 39.0, 36.0, 37.0, 32.0, 37.0, 43.0, 34.0, 32.0, 38.0, 37.0, 28.0, 23.0, 14.0, 14.0, 12.0, 16.0, 8.0, 7.0, 7.0, 5.0, 5.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6811830997467041, -0.6585243344306946, -0.6358655691146851, -0.6132067441940308, -0.5905479788780212, -0.5678892135620117, -0.5452304482460022, -0.5225716829299927, -0.4999128580093384, -0.47725409269332886, -0.45459529757499695, -0.4319365322589874, -0.4092777371406555, -0.386618971824646, -0.3639602065086365, -0.34130141139030457, -0.31864264607429504, -0.2959838807582855, -0.2733250856399536, -0.2506663203239441, -0.22800752520561218, -0.20534875988960266, -0.18268997967243195, -0.16003119945526123, -0.13737241923809052, -0.1147136390209198, -0.09205485880374908, -0.06939608603715897, -0.04673730581998825, -0.024078525602817535, -0.001419752836227417, 0.0212390273809433, 0.043897807598114014, 0.06655658781528473, 0.08921536803245544, 0.11187414079904556, 0.13453292846679688, 0.1571916937828064, 0.1798504739999771, 0.20250925421714783, 0.22516803443431854, 0.24782681465148926, 0.2704855799674988, 0.2931443750858307, 0.3158031404018402, 0.3384619355201721, 0.36112070083618164, 0.38377946615219116, 0.40643826127052307, 0.4290970265865326, 0.4517558217048645, 0.474414587020874, 0.49707338213920593, 0.5197321772575378, 0.5423909425735474, 0.5650497078895569, 0.5877084732055664, 0.6103672385215759, 0.6330260038375854, 0.6556848287582397, 0.6783435940742493, 0.7010023593902588, 0.7236611247062683, 0.7463198900222778, 0.7689787149429321]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 10.0, 12.0, 25.0, 41.0, 61.0, 84.0, 150.0, 220.0, 419.0, 705.0, 1297.0, 2507.0, 5485.0, 12456.0, 32201.0, 102577.0, 647832.0, 3116068.0, 189085.0, 50267.0, 18040.0, 7606.0, 3413.0, 1641.0, 826.0, 486.0, 279.0, 155.0, 114.0, 60.0, 45.0, 32.0, 21.0, 15.0, 10.0, 6.0, 3.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17284584045410156, -0.16649246215820312, -0.1601390838623047, -0.15378570556640625, -0.1474323272705078, -0.14107894897460938, -0.13472557067871094, -0.1283721923828125, -0.12201881408691406, -0.11566543579101562, -0.10931205749511719, -0.10295867919921875, -0.09660530090332031, -0.09025192260742188, -0.08389854431152344, -0.077545166015625, -0.07119178771972656, -0.06483840942382812, -0.05848503112792969, -0.05213165283203125, -0.04577827453613281, -0.039424896240234375, -0.03307151794433594, -0.0267181396484375, -0.020364761352539062, -0.014011383056640625, -0.0076580047607421875, -0.00130462646484375, 0.0050487518310546875, 0.011402130126953125, 0.017755508422851562, 0.02410888671875, 0.030462265014648438, 0.036815643310546875, 0.04316902160644531, 0.04952239990234375, 0.05587577819824219, 0.062229156494140625, 0.06858253479003906, 0.0749359130859375, 0.08128929138183594, 0.08764266967773438, 0.09399604797363281, 0.10034942626953125, 0.10670280456542969, 0.11305618286132812, 0.11940956115722656, 0.125762939453125, 0.13211631774902344, 0.13846969604492188, 0.1448230743408203, 0.15117645263671875, 0.1575298309326172, 0.16388320922851562, 0.17023658752441406, 0.1765899658203125, 0.18294334411621094, 0.18929672241210938, 0.1956501007080078, 0.20200347900390625, 0.2083568572998047, 0.21471023559570312, 0.22106361389160156, 0.2274169921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 4.0, 9.0, 8.0, 14.0, 34.0, 29.0, 20.0, 33.0, 33.0, 40.0, 52.0, 49.0, 44.0, 67.0, 64.0, 50.0, 50.0, 70.0, 45.0, 54.0, 49.0, 27.0, 39.0, 30.0, 18.0, 19.0, 10.0, 6.0, 5.0, 6.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05169677734375, -0.05021381378173828, -0.04873085021972656, -0.047247886657714844, -0.045764923095703125, -0.044281959533691406, -0.04279899597167969, -0.04131603240966797, -0.03983306884765625, -0.03835010528564453, -0.03686714172363281, -0.035384178161621094, -0.033901214599609375, -0.032418251037597656, -0.030935287475585938, -0.02945232391357422, -0.0279693603515625, -0.02648639678955078, -0.025003433227539062, -0.023520469665527344, -0.022037506103515625, -0.020554542541503906, -0.019071578979492188, -0.01758861541748047, -0.01610565185546875, -0.014622688293457031, -0.013139724731445312, -0.011656761169433594, -0.010173797607421875, -0.008690834045410156, -0.0072078704833984375, -0.005724906921386719, -0.004241943359375, -0.0027589797973632812, -0.0012760162353515625, 0.00020694732666015625, 0.001689910888671875, 0.0031728744506835938, 0.0046558380126953125, 0.006138801574707031, 0.00762176513671875, 0.009104728698730469, 0.010587692260742188, 0.012070655822753906, 0.013553619384765625, 0.015036582946777344, 0.016519546508789062, 0.01800251007080078, 0.0194854736328125, 0.02096843719482422, 0.022451400756835938, 0.023934364318847656, 0.025417327880859375, 0.026900291442871094, 0.028383255004882812, 0.02986621856689453, 0.03134918212890625, 0.03283214569091797, 0.03431510925292969, 0.035798072814941406, 0.037281036376953125, 0.038763999938964844, 0.04024696350097656, 0.04172992706298828, 0.043212890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 9.0, 10.0, 16.0, 13.0, 26.0, 44.0, 51.0, 85.0, 138.0, 182.0, 357.0, 541.0, 997.0, 1836.0, 3720.0, 8046.0, 18878.0, 54172.0, 206317.0, 2921042.0, 792066.0, 121942.0, 36944.0, 14187.0, 6116.0, 2859.0, 1525.0, 869.0, 478.0, 286.0, 156.0, 115.0, 75.0, 65.0, 32.0, 18.0, 13.0, 14.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25, -0.2423839569091797, -0.23476791381835938, -0.22715187072753906, -0.21953582763671875, -0.21191978454589844, -0.20430374145507812, -0.1966876983642578, -0.1890716552734375, -0.1814556121826172, -0.17383956909179688, -0.16622352600097656, -0.15860748291015625, -0.15099143981933594, -0.14337539672851562, -0.1357593536376953, -0.128143310546875, -0.12052726745605469, -0.11291122436523438, -0.10529518127441406, -0.09767913818359375, -0.09006309509277344, -0.08244705200195312, -0.07483100891113281, -0.0672149658203125, -0.05959892272949219, -0.051982879638671875, -0.04436683654785156, -0.03675079345703125, -0.029134750366210938, -0.021518707275390625, -0.013902664184570312, -0.00628662109375, 0.0013294219970703125, 0.008945465087890625, 0.016561508178710938, 0.02417755126953125, 0.03179359436035156, 0.039409637451171875, 0.04702568054199219, 0.0546417236328125, 0.06225776672363281, 0.06987380981445312, 0.07748985290527344, 0.08510589599609375, 0.09272193908691406, 0.10033798217773438, 0.10795402526855469, 0.115570068359375, 0.12318611145019531, 0.13080215454101562, 0.13841819763183594, 0.14603424072265625, 0.15365028381347656, 0.16126632690429688, 0.1688823699951172, 0.1764984130859375, 0.1841144561767578, 0.19173049926757812, 0.19934654235839844, 0.20696258544921875, 0.21457862854003906, 0.22219467163085938, 0.2298107147216797, 0.2374267578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 13.0, 22.0, 26.0, 49.0, 61.0, 105.0, 181.0, 310.0, 924.0, 1484.0, 348.0, 180.0, 119.0, 62.0, 45.0, 33.0, 18.0, 17.0, 13.0, 15.0, 7.0, 4.0, 2.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.13291549682617188, -0.12923431396484375, -0.12555313110351562, -0.1218719482421875, -0.11819076538085938, -0.11450958251953125, -0.11082839965820312, -0.107147216796875, -0.10346603393554688, -0.09978485107421875, -0.09610366821289062, -0.0924224853515625, -0.08874130249023438, -0.08506011962890625, -0.08137893676757812, -0.07769775390625, -0.07401657104492188, -0.07033538818359375, -0.06665420532226562, -0.0629730224609375, -0.059291839599609375, -0.05561065673828125, -0.051929473876953125, -0.048248291015625, -0.044567108154296875, -0.04088592529296875, -0.037204742431640625, -0.0335235595703125, -0.029842376708984375, -0.02616119384765625, -0.022480010986328125, -0.018798828125, -0.015117645263671875, -0.01143646240234375, -0.007755279541015625, -0.0040740966796875, -0.000392913818359375, 0.00328826904296875, 0.006969451904296875, 0.010650634765625, 0.014331817626953125, 0.01801300048828125, 0.021694183349609375, 0.0253753662109375, 0.029056549072265625, 0.03273773193359375, 0.036418914794921875, 0.04010009765625, 0.043781280517578125, 0.04746246337890625, 0.051143646240234375, 0.0548248291015625, 0.058506011962890625, 0.06218719482421875, 0.06586837768554688, 0.069549560546875, 0.07323074340820312, 0.07691192626953125, 0.08059310913085938, 0.0842742919921875, 0.08795547485351562, 0.09163665771484375, 0.09531784057617188, 0.0989990234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 21.0, 32.0, 64.0, 101.0, 110.0, 144.0, 143.0, 115.0, 100.0, 68.0, 41.0, 25.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9159307479858398, -0.8875405788421631, -0.8591504693031311, -0.8307603001594543, -0.8023701906204224, -0.7739800214767456, -0.7455899119377136, -0.7171997427940369, -0.6888096332550049, -0.6604194641113281, -0.6320293545722961, -0.6036391854286194, -0.5752490758895874, -0.5468589067459106, -0.5184687972068787, -0.4900786280632019, -0.46168848872184753, -0.43329834938049316, -0.4049082100391388, -0.3765180706977844, -0.34812793135643005, -0.3197377920150757, -0.2913476228713989, -0.26295751333236694, -0.23456735908985138, -0.206177219748497, -0.17778708040714264, -0.14939692616462708, -0.1210067942738533, -0.09261664748191833, -0.06422650814056396, -0.035836368799209595, -0.007446229457855225, 0.020943911746144295, 0.049334052950143814, 0.07772419601678848, 0.10611433535814285, 0.13450448215007782, 0.1628946214914322, 0.19128476083278656, 0.21967490017414093, 0.2480650395154953, 0.27645519375801086, 0.30484533309936523, 0.3332354724407196, 0.361625611782074, 0.39001575112342834, 0.4184058904647827, 0.4467960298061371, 0.47518616914749146, 0.5035763382911682, 0.5319664478302002, 0.560356616973877, 0.5887467265129089, 0.6171368956565857, 0.6455270051956177, 0.6739171743392944, 0.7023073434829712, 0.7306974530220032, 0.7590876221656799, 0.7874777317047119, 0.8158679008483887, 0.8442580103874207, 0.8726481795310974, 0.9010382890701294]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 3.0, 4.0, 3.0, 9.0, 4.0, 6.0, 9.0, 10.0, 15.0, 19.0, 19.0, 30.0, 24.0, 30.0, 24.0, 34.0, 45.0, 41.0, 43.0, 32.0, 45.0, 24.0, 51.0, 58.0, 42.0, 42.0, 35.0, 38.0, 40.0, 32.0, 35.0, 30.0, 16.0, 15.0, 16.0, 14.0, 11.0, 13.0, 9.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.33580803871154785, -0.3247198462486267, -0.31363165378570557, -0.30254343152046204, -0.2914552390575409, -0.28036704659461975, -0.2692788243293762, -0.2581906318664551, -0.24710243940353394, -0.2360142469406128, -0.22492603957653046, -0.21383783221244812, -0.20274963974952698, -0.19166144728660583, -0.1805732399225235, -0.16948503255844116, -0.15839684009552002, -0.14730864763259888, -0.13622044026851654, -0.1251322329044342, -0.11404404044151306, -0.10295584052801132, -0.09186764061450958, -0.08077944070100784, -0.0696912407875061, -0.058603040874004364, -0.047514840960502625, -0.036426641047000885, -0.025338441133499146, -0.014250241219997406, -0.0031620413064956665, 0.007926158607006073, 0.019014358520507812, 0.030102558434009552, 0.04119075834751129, 0.05227895826101303, 0.06336715817451477, 0.07445535808801651, 0.08554355800151825, 0.09663175791501999, 0.10771995782852173, 0.11880815774202347, 0.1298963576555252, 0.14098456501960754, 0.1520727574825287, 0.16316094994544983, 0.17424915730953217, 0.1853373646736145, 0.19642555713653564, 0.2075137495994568, 0.21860195696353912, 0.22969016432762146, 0.2407783567905426, 0.25186654925346375, 0.2629547715187073, 0.2740429639816284, 0.28513115644454956, 0.2962193489074707, 0.30730754137039185, 0.3183957636356354, 0.3294839560985565, 0.34057214856147766, 0.3516603708267212, 0.36274856328964233, 0.3738367557525635]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 8.0, 14.0, 18.0, 21.0, 32.0, 53.0, 80.0, 127.0, 181.0, 328.0, 539.0, 938.0, 1753.0, 3229.0, 6028.0, 11405.0, 21016.0, 39181.0, 69437.0, 124418.0, 244205.0, 245380.0, 124887.0, 69977.0, 39148.0, 21332.0, 11461.0, 6215.0, 3103.0, 1700.0, 914.0, 530.0, 324.0, 174.0, 128.0, 89.0, 48.0, 41.0, 28.0, 17.0, 16.0, 12.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.1279296875, -0.12416744232177734, -0.12040519714355469, -0.11664295196533203, -0.11288070678710938, -0.10911846160888672, -0.10535621643066406, -0.1015939712524414, -0.09783172607421875, -0.0940694808959961, -0.09030723571777344, -0.08654499053955078, -0.08278274536132812, -0.07902050018310547, -0.07525825500488281, -0.07149600982666016, -0.0677337646484375, -0.06397151947021484, -0.06020927429199219, -0.05644702911376953, -0.052684783935546875, -0.04892253875732422, -0.04516029357910156, -0.041398048400878906, -0.03763580322265625, -0.033873558044433594, -0.030111312866210938, -0.02634906768798828, -0.022586822509765625, -0.01882457733154297, -0.015062332153320312, -0.011300086975097656, -0.007537841796875, -0.0037755966186523438, -1.33514404296875e-05, 0.0037488937377929688, 0.007511138916015625, 0.011273384094238281, 0.015035629272460938, 0.018797874450683594, 0.02256011962890625, 0.026322364807128906, 0.030084609985351562, 0.03384685516357422, 0.037609100341796875, 0.04137134552001953, 0.04513359069824219, 0.048895835876464844, 0.0526580810546875, 0.056420326232910156, 0.06018257141113281, 0.06394481658935547, 0.06770706176757812, 0.07146930694580078, 0.07523155212402344, 0.0789937973022461, 0.08275604248046875, 0.0865182876586914, 0.09028053283691406, 0.09404277801513672, 0.09780502319335938, 0.10156726837158203, 0.10532951354980469, 0.10909175872802734, 0.11285400390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 11.0, 13.0, 11.0, 15.0, 13.0, 18.0, 29.0, 32.0, 35.0, 36.0, 31.0, 41.0, 40.0, 53.0, 57.0, 43.0, 55.0, 66.0, 50.0, 43.0, 46.0, 36.0, 29.0, 26.0, 29.0, 27.0, 27.0, 11.0, 13.0, 14.0, 10.0, 4.0, 6.0, 6.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0511474609375, -0.04968118667602539, -0.04821491241455078, -0.04674863815307617, -0.04528236389160156, -0.04381608963012695, -0.042349815368652344, -0.040883541107177734, -0.039417266845703125, -0.037950992584228516, -0.036484718322753906, -0.0350184440612793, -0.03355216979980469, -0.03208589553833008, -0.03061962127685547, -0.02915334701538086, -0.02768707275390625, -0.02622079849243164, -0.02475452423095703, -0.023288249969482422, -0.021821975708007812, -0.020355701446533203, -0.018889427185058594, -0.017423152923583984, -0.015956878662109375, -0.014490604400634766, -0.013024330139160156, -0.011558055877685547, -0.010091781616210938, -0.008625507354736328, -0.007159233093261719, -0.005692958831787109, -0.0042266845703125, -0.0027604103088378906, -0.0012941360473632812, 0.00017213821411132812, 0.0016384124755859375, 0.003104686737060547, 0.004570960998535156, 0.006037235260009766, 0.007503509521484375, 0.008969783782958984, 0.010436058044433594, 0.011902332305908203, 0.013368606567382812, 0.014834880828857422, 0.01630115509033203, 0.01776742935180664, 0.01923370361328125, 0.02069997787475586, 0.02216625213623047, 0.023632526397705078, 0.025098800659179688, 0.026565074920654297, 0.028031349182128906, 0.029497623443603516, 0.030963897705078125, 0.032430171966552734, 0.033896446228027344, 0.03536272048950195, 0.03682899475097656, 0.03829526901245117, 0.03976154327392578, 0.04122781753540039, 0.042694091796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 29.0, 25.0, 25.0, 41.0, 54.0, 87.0, 108.0, 161.0, 235.0, 311.0, 473.0, 833.0, 1602.0, 4506.0, 20114.0, 109364.0, 605977.0, 244796.0, 45561.0, 8749.0, 2484.0, 1075.0, 612.0, 401.0, 268.0, 171.0, 133.0, 92.0, 62.0, 55.0, 31.0, 28.0, 11.0, 14.0, 11.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.3057289123535156, -0.29578399658203125, -0.2858390808105469, -0.2758941650390625, -0.2659492492675781, -0.25600433349609375, -0.24605941772460938, -0.236114501953125, -0.22616958618164062, -0.21622467041015625, -0.20627975463867188, -0.1963348388671875, -0.18638992309570312, -0.17644500732421875, -0.16650009155273438, -0.15655517578125, -0.14661026000976562, -0.13666534423828125, -0.12672042846679688, -0.1167755126953125, -0.10683059692382812, -0.09688568115234375, -0.08694076538085938, -0.076995849609375, -0.06705093383789062, -0.05710601806640625, -0.047161102294921875, -0.0372161865234375, -0.027271270751953125, -0.01732635498046875, -0.007381439208984375, 0.0025634765625, 0.012508392333984375, 0.02245330810546875, 0.032398223876953125, 0.0423431396484375, 0.052288055419921875, 0.06223297119140625, 0.07217788696289062, 0.082122802734375, 0.09206771850585938, 0.10201263427734375, 0.11195755004882812, 0.1219024658203125, 0.13184738159179688, 0.14179229736328125, 0.15173721313476562, 0.16168212890625, 0.17162704467773438, 0.18157196044921875, 0.19151687622070312, 0.2014617919921875, 0.21140670776367188, 0.22135162353515625, 0.23129653930664062, 0.241241455078125, 0.2511863708496094, 0.26113128662109375, 0.2710762023925781, 0.2810211181640625, 0.2909660339355469, 0.30091094970703125, 0.3108558654785156, 0.32080078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 9.0, 19.0, 16.0, 19.0, 24.0, 28.0, 25.0, 32.0, 49.0, 41.0, 46.0, 46.0, 59.0, 43.0, 57.0, 58.0, 46.0, 58.0, 54.0, 33.0, 28.0, 28.0, 23.0, 18.0, 22.0, 18.0, 16.0, 10.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.253662109375, -0.2463550567626953, -0.23904800415039062, -0.23174095153808594, -0.22443389892578125, -0.21712684631347656, -0.20981979370117188, -0.2025127410888672, -0.1952056884765625, -0.1878986358642578, -0.18059158325195312, -0.17328453063964844, -0.16597747802734375, -0.15867042541503906, -0.15136337280273438, -0.1440563201904297, -0.136749267578125, -0.1294422149658203, -0.12213516235351562, -0.11482810974121094, -0.10752105712890625, -0.10021400451660156, -0.09290695190429688, -0.08559989929199219, -0.0782928466796875, -0.07098579406738281, -0.06367874145507812, -0.05637168884277344, -0.04906463623046875, -0.04175758361816406, -0.034450531005859375, -0.027143478393554688, -0.01983642578125, -0.012529373168945312, -0.005222320556640625, 0.0020847320556640625, 0.00939178466796875, 0.016698837280273438, 0.024005889892578125, 0.03131294250488281, 0.0386199951171875, 0.04592704772949219, 0.053234100341796875, 0.06054115295410156, 0.06784820556640625, 0.07515525817871094, 0.08246231079101562, 0.08976936340332031, 0.097076416015625, 0.10438346862792969, 0.11169052124023438, 0.11899757385253906, 0.12630462646484375, 0.13361167907714844, 0.14091873168945312, 0.1482257843017578, 0.1555328369140625, 0.1628398895263672, 0.17014694213867188, 0.17745399475097656, 0.18476104736328125, 0.19206809997558594, 0.19937515258789062, 0.2066822052001953, 0.2139892578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 5.0, 6.0, 10.0, 22.0, 17.0, 22.0, 48.0, 77.0, 131.0, 180.0, 324.0, 627.0, 1199.0, 2640.0, 6579.0, 20433.0, 84140.0, 476590.0, 355924.0, 71258.0, 17546.0, 5820.0, 2329.0, 1183.0, 591.0, 322.0, 180.0, 127.0, 76.0, 37.0, 30.0, 29.0, 12.0, 7.0, 7.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1700439453125, -0.1647205352783203, -0.15939712524414062, -0.15407371520996094, -0.14875030517578125, -0.14342689514160156, -0.13810348510742188, -0.1327800750732422, -0.1274566650390625, -0.12213325500488281, -0.11680984497070312, -0.11148643493652344, -0.10616302490234375, -0.10083961486816406, -0.09551620483398438, -0.09019279479980469, -0.084869384765625, -0.07954597473144531, -0.07422256469726562, -0.06889915466308594, -0.06357574462890625, -0.05825233459472656, -0.052928924560546875, -0.04760551452636719, -0.0422821044921875, -0.03695869445800781, -0.031635284423828125, -0.026311874389648438, -0.02098846435546875, -0.015665054321289062, -0.010341644287109375, -0.0050182342529296875, 0.00030517578125, 0.0056285858154296875, 0.010951995849609375, 0.016275405883789062, 0.02159881591796875, 0.026922225952148438, 0.032245635986328125, 0.03756904602050781, 0.0428924560546875, 0.04821586608886719, 0.053539276123046875, 0.05886268615722656, 0.06418609619140625, 0.06950950622558594, 0.07483291625976562, 0.08015632629394531, 0.085479736328125, 0.09080314636230469, 0.09612655639648438, 0.10144996643066406, 0.10677337646484375, 0.11209678649902344, 0.11742019653320312, 0.12274360656738281, 0.1280670166015625, 0.1333904266357422, 0.13871383666992188, 0.14403724670410156, 0.14936065673828125, 0.15468406677246094, 0.16000747680664062, 0.1653308868408203, 0.170654296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 1.0, 2.0, 5.0, 4.0, 12.0, 13.0, 22.0, 20.0, 29.0, 33.0, 56.0, 73.0, 89.0, 98.0, 108.0, 102.0, 78.0, 80.0, 44.0, 28.0, 32.0, 19.0, 18.0, 12.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.177757263183594e-05, -7.812492549419403e-05, -7.447227835655212e-05, -7.081963121891022e-05, -6.716698408126831e-05, -6.35143369436264e-05, -5.98616898059845e-05, -5.620904266834259e-05, -5.2556395530700684e-05, -4.890374839305878e-05, -4.525110125541687e-05, -4.159845411777496e-05, -3.794580698013306e-05, -3.429315984249115e-05, -3.064051270484924e-05, -2.6987865567207336e-05, -2.333521842956543e-05, -1.9682571291923523e-05, -1.6029924154281616e-05, -1.237727701663971e-05, -8.724629878997803e-06, -5.071982741355896e-06, -1.4193356037139893e-06, 2.2333115339279175e-06, 5.885958671569824e-06, 9.538605809211731e-06, 1.3191252946853638e-05, 1.6843900084495544e-05, 2.049654722213745e-05, 2.4149194359779358e-05, 2.7801841497421265e-05, 3.145448863506317e-05, 3.510713577270508e-05, 3.8759782910346985e-05, 4.241243004798889e-05, 4.60650771856308e-05, 4.9717724323272705e-05, 5.337037146091461e-05, 5.702301859855652e-05, 6.0675665736198425e-05, 6.432831287384033e-05, 6.798096001148224e-05, 7.163360714912415e-05, 7.528625428676605e-05, 7.893890142440796e-05, 8.259154856204987e-05, 8.624419569969177e-05, 8.989684283733368e-05, 9.354948997497559e-05, 9.720213711261749e-05, 0.0001008547842502594, 0.0001045074313879013, 0.00010816007852554321, 0.00011181272566318512, 0.00011546537280082703, 0.00011911801993846893, 0.00012277066707611084, 0.00012642331421375275, 0.00013007596135139465, 0.00013372860848903656, 0.00013738125562667847, 0.00014103390276432037, 0.00014468654990196228, 0.0001483391970396042, 0.0001519918441772461]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 10.0, 3.0, 19.0, 20.0, 31.0, 62.0, 70.0, 122.0, 179.0, 336.0, 617.0, 1425.0, 3948.0, 16633.0, 106360.0, 676025.0, 204504.0, 28449.0, 5963.0, 1938.0, 811.0, 417.0, 234.0, 119.0, 78.0, 58.0, 41.0, 15.0, 10.0, 12.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2337646484375, -0.2266063690185547, -0.21944808959960938, -0.21228981018066406, -0.20513153076171875, -0.19797325134277344, -0.19081497192382812, -0.1836566925048828, -0.1764984130859375, -0.1693401336669922, -0.16218185424804688, -0.15502357482910156, -0.14786529541015625, -0.14070701599121094, -0.13354873657226562, -0.1263904571533203, -0.119232177734375, -0.11207389831542969, -0.10491561889648438, -0.09775733947753906, -0.09059906005859375, -0.08344078063964844, -0.07628250122070312, -0.06912422180175781, -0.0619659423828125, -0.05480766296386719, -0.047649383544921875, -0.04049110412597656, -0.03333282470703125, -0.026174545288085938, -0.019016265869140625, -0.011857986450195312, -0.00469970703125, 0.0024585723876953125, 0.009616851806640625, 0.016775131225585938, 0.02393341064453125, 0.031091690063476562, 0.038249969482421875, 0.04540824890136719, 0.0525665283203125, 0.05972480773925781, 0.06688308715820312, 0.07404136657714844, 0.08119964599609375, 0.08835792541503906, 0.09551620483398438, 0.10267448425292969, 0.109832763671875, 0.11699104309082031, 0.12414932250976562, 0.13130760192871094, 0.13846588134765625, 0.14562416076660156, 0.15278244018554688, 0.1599407196044922, 0.1670989990234375, 0.1742572784423828, 0.18141555786132812, 0.18857383728027344, 0.19573211669921875, 0.20289039611816406, 0.21004867553710938, 0.2172069549560547, 0.224365234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 7.0, 9.0, 14.0, 13.0, 21.0, 21.0, 19.0, 20.0, 25.0, 54.0, 54.0, 80.0, 84.0, 97.0, 85.0, 77.0, 64.0, 45.0, 32.0, 34.0, 25.0, 23.0, 21.0, 15.0, 8.0, 12.0, 7.0, 3.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1300048828125, -0.12613773345947266, -0.12227058410644531, -0.11840343475341797, -0.11453628540039062, -0.11066913604736328, -0.10680198669433594, -0.1029348373413086, -0.09906768798828125, -0.0952005386352539, -0.09133338928222656, -0.08746623992919922, -0.08359909057617188, -0.07973194122314453, -0.07586479187011719, -0.07199764251708984, -0.0681304931640625, -0.06426334381103516, -0.06039619445800781, -0.05652904510498047, -0.052661895751953125, -0.04879474639892578, -0.04492759704589844, -0.041060447692871094, -0.03719329833984375, -0.033326148986816406, -0.029458999633789062, -0.02559185028076172, -0.021724700927734375, -0.01785755157470703, -0.013990402221679688, -0.010123252868652344, -0.006256103515625, -0.0023889541625976562, 0.0014781951904296875, 0.005345344543457031, 0.009212493896484375, 0.013079643249511719, 0.016946792602539062, 0.020813941955566406, 0.02468109130859375, 0.028548240661621094, 0.03241539001464844, 0.03628253936767578, 0.040149688720703125, 0.04401683807373047, 0.04788398742675781, 0.051751136779785156, 0.0556182861328125, 0.059485435485839844, 0.06335258483886719, 0.06721973419189453, 0.07108688354492188, 0.07495403289794922, 0.07882118225097656, 0.0826883316040039, 0.08655548095703125, 0.0904226303100586, 0.09428977966308594, 0.09815692901611328, 0.10202407836914062, 0.10589122772216797, 0.10975837707519531, 0.11362552642822266, 0.11749267578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 17.0, 61.0, 104.0, 174.0, 193.0, 195.0, 133.0, 70.0, 35.0, 10.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.692439556121826, -4.590233325958252, -4.4880266189575195, -4.385820388793945, -4.283614158630371, -4.181407451629639, -4.0792012214660645, -3.976994752883911, -3.874788284301758, -3.7725818157196045, -3.670375347137451, -3.568169116973877, -3.4659626483917236, -3.3637561798095703, -3.261549949645996, -3.1593434810638428, -3.0571370124816895, -2.954930543899536, -2.852724075317383, -2.7505178451538086, -2.6483113765716553, -2.546104907989502, -2.4438986778259277, -2.3416922092437744, -2.239485740661621, -2.1372792720794678, -2.0350728034973145, -1.9328665733337402, -1.830660104751587, -1.7284536361694336, -1.6262472867965698, -1.524040937423706, -1.4218345880508423, -1.3196282386779785, -1.2174217700958252, -1.1152153015136719, -1.013008952140808, -0.9108025431632996, -0.808596134185791, -0.7063897252082825, -0.6041833162307739, -0.5019769072532654, -0.39977049827575684, -0.2975640892982483, -0.19535768032073975, -0.0931512713432312, 0.009055137634277344, 0.11126154661178589, 0.21346795558929443, 0.315674364566803, 0.4178807735443115, 0.5200871825218201, 0.6222935914993286, 0.7245000004768372, 0.8267064094543457, 0.9289128184318542, 1.0311192274093628, 1.1333255767822266, 1.2355320453643799, 1.3377385139465332, 1.439944863319397, 1.5421512126922607, 1.644357681274414, 1.7465641498565674, 1.8487704992294312]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 8.0, 8.0, 8.0, 6.0, 12.0, 13.0, 9.0, 23.0, 25.0, 20.0, 28.0, 23.0, 34.0, 42.0, 42.0, 42.0, 51.0, 50.0, 41.0, 58.0, 41.0, 42.0, 39.0, 40.0, 32.0, 40.0, 43.0, 35.0, 29.0, 20.0, 21.0, 12.0, 14.0, 12.0, 8.0, 5.0, 12.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1537410020828247, -1.1154236793518066, -1.0771063566207886, -1.0387890338897705, -1.0004717111587524, -0.9621543884277344, -0.9238371253013611, -0.885519802570343, -0.847202479839325, -0.8088851571083069, -0.7705678343772888, -0.7322505116462708, -0.6939332485198975, -0.6556159257888794, -0.6172986030578613, -0.5789812803268433, -0.5406639575958252, -0.5023466348648071, -0.46402931213378906, -0.4257120192050934, -0.3873946964740753, -0.34907737374305725, -0.3107600808143616, -0.2724427580833435, -0.23412543535232544, -0.19580811262130737, -0.1574908047914505, -0.11917348951101303, -0.08085617423057556, -0.042538851499557495, -0.0042215436697006226, 0.03409576416015625, 0.07241296768188477, 0.11073028296232224, 0.1490475982427597, 0.18736490607261658, 0.22568222880363464, 0.2639995515346527, 0.3023168444633484, 0.34063416719436646, 0.3789514899253845, 0.4172688126564026, 0.45558613538742065, 0.49390342831611633, 0.532220721244812, 0.5705380439758301, 0.6088553667068481, 0.6471726894378662, 0.6854900121688843, 0.7238073348999023, 0.7621246576309204, 0.8004419803619385, 0.8387593030929565, 0.8770766258239746, 0.9153938889503479, 0.953711211681366, 0.992028534412384, 1.0303457975387573, 1.0686631202697754, 1.1069804430007935, 1.1452977657318115, 1.1836150884628296, 1.2219324111938477, 1.2602497339248657, 1.2985670566558838]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 12.0, 10.0, 25.0, 44.0, 54.0, 75.0, 102.0, 161.0, 280.0, 466.0, 835.0, 1509.0, 3048.0, 6090.0, 14360.0, 36824.0, 122517.0, 795855.0, 2900838.0, 218077.0, 56658.0, 19975.0, 8243.0, 3715.0, 1953.0, 978.0, 600.0, 337.0, 196.0, 133.0, 93.0, 61.0, 37.0, 33.0, 18.0, 22.0, 5.0, 6.0, 3.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20751953125, -0.20064544677734375, -0.1937713623046875, -0.18689727783203125, -0.180023193359375, -0.17314910888671875, -0.1662750244140625, -0.15940093994140625, -0.15252685546875, -0.14565277099609375, -0.1387786865234375, -0.13190460205078125, -0.125030517578125, -0.11815643310546875, -0.1112823486328125, -0.10440826416015625, -0.0975341796875, -0.09066009521484375, -0.0837860107421875, -0.07691192626953125, -0.070037841796875, -0.06316375732421875, -0.0562896728515625, -0.04941558837890625, -0.04254150390625, -0.03566741943359375, -0.0287933349609375, -0.02191925048828125, -0.015045166015625, -0.00817108154296875, -0.0012969970703125, 0.00557708740234375, 0.012451171875, 0.01932525634765625, 0.0261993408203125, 0.03307342529296875, 0.039947509765625, 0.04682159423828125, 0.0536956787109375, 0.06056976318359375, 0.06744384765625, 0.07431793212890625, 0.0811920166015625, 0.08806610107421875, 0.094940185546875, 0.10181427001953125, 0.1086883544921875, 0.11556243896484375, 0.1224365234375, 0.12931060791015625, 0.1361846923828125, 0.14305877685546875, 0.149932861328125, 0.15680694580078125, 0.1636810302734375, 0.17055511474609375, 0.17742919921875, 0.18430328369140625, 0.1911773681640625, 0.19805145263671875, 0.204925537109375, 0.21179962158203125, 0.2186737060546875, 0.22554779052734375, 0.232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 10.0, 11.0, 11.0, 16.0, 14.0, 16.0, 22.0, 19.0, 30.0, 33.0, 27.0, 33.0, 32.0, 35.0, 42.0, 41.0, 35.0, 41.0, 53.0, 30.0, 48.0, 38.0, 39.0, 42.0, 39.0, 33.0, 39.0, 26.0, 18.0, 17.0, 13.0, 20.0, 11.0, 12.0, 10.0, 11.0, 6.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046966552734375, -0.04559326171875, -0.044219970703125, -0.0428466796875, -0.041473388671875, -0.04010009765625, -0.038726806640625, -0.037353515625, -0.035980224609375, -0.03460693359375, -0.033233642578125, -0.0318603515625, -0.030487060546875, -0.02911376953125, -0.027740478515625, -0.0263671875, -0.024993896484375, -0.02362060546875, -0.022247314453125, -0.0208740234375, -0.019500732421875, -0.01812744140625, -0.016754150390625, -0.015380859375, -0.014007568359375, -0.01263427734375, -0.011260986328125, -0.0098876953125, -0.008514404296875, -0.00714111328125, -0.005767822265625, -0.00439453125, -0.003021240234375, -0.00164794921875, -0.000274658203125, 0.0010986328125, 0.002471923828125, 0.00384521484375, 0.005218505859375, 0.006591796875, 0.007965087890625, 0.00933837890625, 0.010711669921875, 0.0120849609375, 0.013458251953125, 0.01483154296875, 0.016204833984375, 0.017578125, 0.018951416015625, 0.02032470703125, 0.021697998046875, 0.0230712890625, 0.024444580078125, 0.02581787109375, 0.027191162109375, 0.028564453125, 0.029937744140625, 0.03131103515625, 0.032684326171875, 0.0340576171875, 0.035430908203125, 0.03680419921875, 0.038177490234375, 0.03955078125, 0.040924072265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 8.0, 13.0, 20.0, 23.0, 29.0, 39.0, 58.0, 85.0, 112.0, 160.0, 238.0, 341.0, 499.0, 831.0, 1289.0, 2094.0, 3852.0, 7056.0, 14072.0, 30398.0, 73995.0, 218197.0, 1228211.0, 2186493.0, 269643.0, 87062.0, 35223.0, 15843.0, 7788.0, 4311.0, 2273.0, 1400.0, 862.0, 537.0, 388.0, 247.0, 176.0, 120.0, 96.0, 47.0, 37.0, 23.0, 26.0, 22.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0], "bins": [-0.2239990234375, -0.21722793579101562, -0.21045684814453125, -0.20368576049804688, -0.1969146728515625, -0.19014358520507812, -0.18337249755859375, -0.17660140991210938, -0.169830322265625, -0.16305923461914062, -0.15628814697265625, -0.14951705932617188, -0.1427459716796875, -0.13597488403320312, -0.12920379638671875, -0.12243270874023438, -0.11566162109375, -0.10889053344726562, -0.10211944580078125, -0.09534835815429688, -0.0885772705078125, -0.08180618286132812, -0.07503509521484375, -0.06826400756835938, -0.061492919921875, -0.054721832275390625, -0.04795074462890625, -0.041179656982421875, -0.0344085693359375, -0.027637481689453125, -0.02086639404296875, -0.014095306396484375, -0.00732421875, -0.000553131103515625, 0.00621795654296875, 0.012989044189453125, 0.0197601318359375, 0.026531219482421875, 0.03330230712890625, 0.040073394775390625, 0.046844482421875, 0.053615570068359375, 0.06038665771484375, 0.06715774536132812, 0.0739288330078125, 0.08069992065429688, 0.08747100830078125, 0.09424209594726562, 0.10101318359375, 0.10778427124023438, 0.11455535888671875, 0.12132644653320312, 0.1280975341796875, 0.13486862182617188, 0.14163970947265625, 0.14841079711914062, 0.155181884765625, 0.16195297241210938, 0.16872406005859375, 0.17549514770507812, 0.1822662353515625, 0.18903732299804688, 0.19580841064453125, 0.20257949829101562, 0.2093505859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 19.0, 5.0, 23.0, 24.0, 29.0, 46.0, 67.0, 104.0, 128.0, 223.0, 381.0, 837.0, 1059.0, 354.0, 241.0, 126.0, 110.0, 78.0, 49.0, 32.0, 33.0, 17.0, 8.0, 16.0, 10.0, 9.0, 6.0, 1.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1441650390625, -0.1398029327392578, -0.13544082641601562, -0.13107872009277344, -0.12671661376953125, -0.12235450744628906, -0.11799240112304688, -0.11363029479980469, -0.1092681884765625, -0.10490608215332031, -0.10054397583007812, -0.09618186950683594, -0.09181976318359375, -0.08745765686035156, -0.08309555053710938, -0.07873344421386719, -0.074371337890625, -0.07000923156738281, -0.06564712524414062, -0.06128501892089844, -0.05692291259765625, -0.05256080627441406, -0.048198699951171875, -0.04383659362792969, -0.0394744873046875, -0.03511238098144531, -0.030750274658203125, -0.026388168334960938, -0.02202606201171875, -0.017663955688476562, -0.013301849365234375, -0.008939743041992188, -0.00457763671875, -0.0002155303955078125, 0.004146575927734375, 0.008508682250976562, 0.01287078857421875, 0.017232894897460938, 0.021595001220703125, 0.025957107543945312, 0.0303192138671875, 0.03468132019042969, 0.039043426513671875, 0.04340553283691406, 0.04776763916015625, 0.05212974548339844, 0.056491851806640625, 0.06085395812988281, 0.065216064453125, 0.06957817077636719, 0.07394027709960938, 0.07830238342285156, 0.08266448974609375, 0.08702659606933594, 0.09138870239257812, 0.09575080871582031, 0.1001129150390625, 0.10447502136230469, 0.10883712768554688, 0.11319923400878906, 0.11756134033203125, 0.12192344665527344, 0.12628555297851562, 0.1306476593017578, 0.135009765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 12.0, 21.0, 32.0, 56.0, 104.0, 145.0, 160.0, 145.0, 123.0, 88.0, 42.0, 38.0, 19.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.285744547843933, -1.2390635013580322, -1.1923824548721313, -1.1457014083862305, -1.0990204811096191, -1.0523394346237183, -1.0056583881378174, -0.9589773416519165, -0.9122962951660156, -0.8656152486801147, -0.8189342021942139, -0.7722532153129578, -0.7255721688270569, -0.678891122341156, -0.6322101354598999, -0.585529088973999, -0.5388480424880981, -0.49216699600219727, -0.4454859793186188, -0.3988049626350403, -0.3521239161491394, -0.3054428696632385, -0.25876185297966003, -0.21208083629608154, -0.16539978981018066, -0.11871875822544098, -0.0720377266407013, -0.02535669505596161, 0.021324336528778076, 0.06800536811351776, 0.11468639969825745, 0.16136741638183594, 0.20804858207702637, 0.25472962856292725, 0.30141064524650574, 0.34809166193008423, 0.3947727084159851, 0.441453754901886, 0.4881347715854645, 0.534815788269043, 0.5814968347549438, 0.6281778812408447, 0.6748589277267456, 0.7215399146080017, 0.7682209610939026, 0.8149020075798035, 0.8615829944610596, 0.9082640409469604, 0.9549450874328613, 1.0016261339187622, 1.048307180404663, 1.094988226890564, 1.1416692733764648, 1.1883502006530762, 1.235031247138977, 1.281712293624878, 1.3283933401107788, 1.3750743865966797, 1.4217554330825806, 1.4684364795684814, 1.5151174068450928, 1.5617984533309937, 1.6084794998168945, 1.6551605463027954, 1.7018415927886963]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 4.0, 8.0, 10.0, 16.0, 18.0, 23.0, 25.0, 25.0, 23.0, 23.0, 30.0, 33.0, 41.0, 40.0, 40.0, 34.0, 44.0, 31.0, 39.0, 33.0, 33.0, 32.0, 34.0, 37.0, 30.0, 28.0, 23.0, 26.0, 19.0, 27.0, 25.0, 16.0, 17.0, 15.0, 16.0, 8.0, 7.0, 9.0, 11.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.4640202522277832, -0.449476957321167, -0.4349336326122284, -0.4203903377056122, -0.40584704279899597, -0.3913037180900574, -0.37676042318344116, -0.36221712827682495, -0.34767383337020874, -0.33313053846359253, -0.31858721375465393, -0.3040439188480377, -0.2895006239414215, -0.2749572992324829, -0.2604140043258667, -0.2458707094192505, -0.2313273847103119, -0.21678407490253448, -0.20224077999591827, -0.18769747018814087, -0.17315417528152466, -0.15861086547374725, -0.14406755566596985, -0.12952426075935364, -0.11498095095157623, -0.10043764859437943, -0.08589434623718262, -0.07135103642940521, -0.056807734072208405, -0.0422644317150116, -0.027721121907234192, -0.013177819550037384, 0.0013654828071594238, 0.01590878702700138, 0.030452091246843338, 0.044995397329330444, 0.05953869968652725, 0.07408200204372406, 0.08862531185150146, 0.10316861420869827, 0.11771191656589508, 0.13225522637367249, 0.1467985212802887, 0.1613418310880661, 0.1758851408958435, 0.19042843580245972, 0.20497174561023712, 0.21951505541801453, 0.23405835032463074, 0.24860166013240814, 0.26314496994018555, 0.27768826484680176, 0.29223155975341797, 0.3067748546600342, 0.3213181793689728, 0.335861474275589, 0.3504047989845276, 0.3649480938911438, 0.3794914186000824, 0.3940347135066986, 0.4085780084133148, 0.4231213331222534, 0.43766462802886963, 0.45220792293548584, 0.46675121784210205]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 10.0, 12.0, 15.0, 17.0, 33.0, 46.0, 53.0, 94.0, 135.0, 212.0, 316.0, 487.0, 770.0, 1330.0, 2167.0, 3886.0, 6420.0, 10918.0, 18418.0, 31756.0, 53653.0, 88780.0, 135925.0, 179940.0, 176671.0, 130271.0, 83673.0, 50498.0, 29663.0, 17404.0, 10225.0, 5889.0, 3427.0, 2006.0, 1224.0, 798.0, 466.0, 309.0, 210.0, 118.0, 94.0, 61.0, 34.0, 36.0, 22.0, 17.0, 6.0, 12.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.11029052734375, -0.10694217681884766, -0.10359382629394531, -0.10024547576904297, -0.09689712524414062, -0.09354877471923828, -0.09020042419433594, -0.0868520736694336, -0.08350372314453125, -0.0801553726196289, -0.07680702209472656, -0.07345867156982422, -0.07011032104492188, -0.06676197052001953, -0.06341361999511719, -0.060065269470214844, -0.0567169189453125, -0.053368568420410156, -0.05002021789550781, -0.04667186737060547, -0.043323516845703125, -0.03997516632080078, -0.03662681579589844, -0.033278465270996094, -0.02993011474609375, -0.026581764221191406, -0.023233413696289062, -0.01988506317138672, -0.016536712646484375, -0.013188362121582031, -0.009840011596679688, -0.006491661071777344, -0.003143310546875, 0.00020503997802734375, 0.0035533905029296875, 0.006901741027832031, 0.010250091552734375, 0.013598442077636719, 0.016946792602539062, 0.020295143127441406, 0.02364349365234375, 0.026991844177246094, 0.030340194702148438, 0.03368854522705078, 0.037036895751953125, 0.04038524627685547, 0.04373359680175781, 0.047081947326660156, 0.0504302978515625, 0.053778648376464844, 0.05712699890136719, 0.06047534942626953, 0.06382369995117188, 0.06717205047607422, 0.07052040100097656, 0.0738687515258789, 0.07721710205078125, 0.0805654525756836, 0.08391380310058594, 0.08726215362548828, 0.09061050415039062, 0.09395885467529297, 0.09730720520019531, 0.10065555572509766, 0.10400390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 5.0, 8.0, 5.0, 16.0, 17.0, 7.0, 15.0, 20.0, 30.0, 21.0, 19.0, 27.0, 31.0, 30.0, 36.0, 36.0, 36.0, 44.0, 40.0, 56.0, 51.0, 46.0, 39.0, 32.0, 44.0, 26.0, 31.0, 26.0, 26.0, 24.0, 21.0, 17.0, 18.0, 7.0, 16.0, 17.0, 10.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046844482421875, -0.045360565185546875, -0.04387664794921875, -0.042392730712890625, -0.0409088134765625, -0.039424896240234375, -0.03794097900390625, -0.036457061767578125, -0.03497314453125, -0.033489227294921875, -0.03200531005859375, -0.030521392822265625, -0.0290374755859375, -0.027553558349609375, -0.02606964111328125, -0.024585723876953125, -0.023101806640625, -0.021617889404296875, -0.02013397216796875, -0.018650054931640625, -0.0171661376953125, -0.015682220458984375, -0.01419830322265625, -0.012714385986328125, -0.01123046875, -0.009746551513671875, -0.00826263427734375, -0.006778717041015625, -0.0052947998046875, -0.003810882568359375, -0.00232696533203125, -0.000843048095703125, 0.000640869140625, 0.002124786376953125, 0.00360870361328125, 0.005092620849609375, 0.0065765380859375, 0.008060455322265625, 0.00954437255859375, 0.011028289794921875, 0.01251220703125, 0.013996124267578125, 0.01548004150390625, 0.016963958740234375, 0.0184478759765625, 0.019931793212890625, 0.02141571044921875, 0.022899627685546875, 0.024383544921875, 0.025867462158203125, 0.02735137939453125, 0.028835296630859375, 0.0303192138671875, 0.031803131103515625, 0.03328704833984375, 0.034770965576171875, 0.0362548828125, 0.037738800048828125, 0.03922271728515625, 0.040706634521484375, 0.0421905517578125, 0.043674468994140625, 0.04515838623046875, 0.046642303466796875, 0.048126220703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 9.0, 18.0, 21.0, 18.0, 30.0, 45.0, 69.0, 82.0, 126.0, 158.0, 255.0, 353.0, 543.0, 957.0, 1945.0, 6638.0, 32432.0, 197431.0, 589654.0, 177483.0, 29631.0, 6091.0, 1927.0, 878.0, 523.0, 336.0, 246.0, 181.0, 141.0, 76.0, 68.0, 41.0, 31.0, 24.0, 30.0, 14.0, 11.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3319969177246094, -0.32073211669921875, -0.3094673156738281, -0.2982025146484375, -0.2869377136230469, -0.27567291259765625, -0.2644081115722656, -0.253143310546875, -0.24187850952148438, -0.23061370849609375, -0.21934890747070312, -0.2080841064453125, -0.19681930541992188, -0.18555450439453125, -0.17428970336914062, -0.16302490234375, -0.15176010131835938, -0.14049530029296875, -0.12923049926757812, -0.1179656982421875, -0.10670089721679688, -0.09543609619140625, -0.08417129516601562, -0.072906494140625, -0.061641693115234375, -0.05037689208984375, -0.039112091064453125, -0.0278472900390625, -0.016582489013671875, -0.00531768798828125, 0.005947113037109375, 0.0172119140625, 0.028476715087890625, 0.03974151611328125, 0.051006317138671875, 0.0622711181640625, 0.07353591918945312, 0.08480072021484375, 0.09606552124023438, 0.107330322265625, 0.11859512329101562, 0.12985992431640625, 0.14112472534179688, 0.1523895263671875, 0.16365432739257812, 0.17491912841796875, 0.18618392944335938, 0.19744873046875, 0.20871353149414062, 0.21997833251953125, 0.23124313354492188, 0.2425079345703125, 0.2537727355957031, 0.26503753662109375, 0.2763023376464844, 0.287567138671875, 0.2988319396972656, 0.31009674072265625, 0.3213615417480469, 0.3326263427734375, 0.3438911437988281, 0.35515594482421875, 0.3664207458496094, 0.377685546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 5.0, 4.0, 10.0, 11.0, 17.0, 13.0, 8.0, 17.0, 14.0, 19.0, 15.0, 25.0, 34.0, 35.0, 27.0, 32.0, 32.0, 47.0, 64.0, 34.0, 37.0, 41.0, 40.0, 36.0, 32.0, 37.0, 41.0, 35.0, 35.0, 23.0, 19.0, 31.0, 20.0, 20.0, 9.0, 16.0, 10.0, 5.0, 7.0, 6.0, 5.0, 4.0, 0.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.259765625, -0.25160980224609375, -0.2434539794921875, -0.23529815673828125, -0.227142333984375, -0.21898651123046875, -0.2108306884765625, -0.20267486572265625, -0.19451904296875, -0.18636322021484375, -0.1782073974609375, -0.17005157470703125, -0.161895751953125, -0.15373992919921875, -0.1455841064453125, -0.13742828369140625, -0.1292724609375, -0.12111663818359375, -0.1129608154296875, -0.10480499267578125, -0.096649169921875, -0.08849334716796875, -0.0803375244140625, -0.07218170166015625, -0.06402587890625, -0.05587005615234375, -0.0477142333984375, -0.03955841064453125, -0.031402587890625, -0.02324676513671875, -0.0150909423828125, -0.00693511962890625, 0.001220703125, 0.00937652587890625, 0.0175323486328125, 0.02568817138671875, 0.033843994140625, 0.04199981689453125, 0.0501556396484375, 0.05831146240234375, 0.06646728515625, 0.07462310791015625, 0.0827789306640625, 0.09093475341796875, 0.099090576171875, 0.10724639892578125, 0.1154022216796875, 0.12355804443359375, 0.1317138671875, 0.13986968994140625, 0.1480255126953125, 0.15618133544921875, 0.164337158203125, 0.17249298095703125, 0.1806488037109375, 0.18880462646484375, 0.19696044921875, 0.20511627197265625, 0.2132720947265625, 0.22142791748046875, 0.229583740234375, 0.23773956298828125, 0.2458953857421875, 0.25405120849609375, 0.26220703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 8.0, 5.0, 6.0, 10.0, 14.0, 19.0, 29.0, 47.0, 51.0, 99.0, 138.0, 278.0, 472.0, 910.0, 2102.0, 4925.0, 14174.0, 50733.0, 235469.0, 520473.0, 163395.0, 36662.0, 11077.0, 3899.0, 1678.0, 830.0, 410.0, 211.0, 128.0, 101.0, 64.0, 47.0, 19.0, 22.0, 24.0, 11.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2061767578125, -0.20000076293945312, -0.19382476806640625, -0.18764877319335938, -0.1814727783203125, -0.17529678344726562, -0.16912078857421875, -0.16294479370117188, -0.156768798828125, -0.15059280395507812, -0.14441680908203125, -0.13824081420898438, -0.1320648193359375, -0.12588882446289062, -0.11971282958984375, -0.11353683471679688, -0.10736083984375, -0.10118484497070312, -0.09500885009765625, -0.08883285522460938, -0.0826568603515625, -0.07648086547851562, -0.07030487060546875, -0.06412887573242188, -0.057952880859375, -0.051776885986328125, -0.04560089111328125, -0.039424896240234375, -0.0332489013671875, -0.027072906494140625, -0.02089691162109375, -0.014720916748046875, -0.008544921875, -0.002368927001953125, 0.00380706787109375, 0.009983062744140625, 0.0161590576171875, 0.022335052490234375, 0.02851104736328125, 0.034687042236328125, 0.040863037109375, 0.047039031982421875, 0.05321502685546875, 0.059391021728515625, 0.0655670166015625, 0.07174301147460938, 0.07791900634765625, 0.08409500122070312, 0.09027099609375, 0.09644699096679688, 0.10262298583984375, 0.10879898071289062, 0.1149749755859375, 0.12115097045898438, 0.12732696533203125, 0.13350296020507812, 0.139678955078125, 0.14585494995117188, 0.15203094482421875, 0.15820693969726562, 0.1643829345703125, 0.17055892944335938, 0.17673492431640625, 0.18291091918945312, 0.1890869140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 11.0, 11.0, 22.0, 22.0, 22.0, 30.0, 36.0, 45.0, 47.0, 69.0, 68.0, 101.0, 75.0, 65.0, 74.0, 59.0, 58.0, 36.0, 31.0, 27.0, 14.0, 12.0, 18.0, 6.0, 4.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00013530254364013672, -0.00013203732669353485, -0.00012877210974693298, -0.00012550689280033112, -0.00012224167585372925, -0.00011897645890712738, -0.00011571124196052551, -0.00011244602501392365, -0.00010918080806732178, -0.00010591559112071991, -0.00010265037417411804, -9.938515722751617e-05, -9.61199402809143e-05, -9.285472333431244e-05, -8.958950638771057e-05, -8.63242894411087e-05, -8.305907249450684e-05, -7.979385554790497e-05, -7.65286386013031e-05, -7.326342165470123e-05, -6.999820470809937e-05, -6.67329877614975e-05, -6.346777081489563e-05, -6.020255386829376e-05, -5.6937336921691895e-05, -5.367211997509003e-05, -5.040690302848816e-05, -4.714168608188629e-05, -4.3876469135284424e-05, -4.0611252188682556e-05, -3.734603524208069e-05, -3.408081829547882e-05, -3.081560134887695e-05, -2.7550384402275085e-05, -2.4285167455673218e-05, -2.101995050907135e-05, -1.7754733562469482e-05, -1.4489516615867615e-05, -1.1224299669265747e-05, -7.95908272266388e-06, -4.693865776062012e-06, -1.428648829460144e-06, 1.8365681171417236e-06, 5.101785063743591e-06, 8.367002010345459e-06, 1.1632218956947327e-05, 1.4897435903549194e-05, 1.8162652850151062e-05, 2.142786979675293e-05, 2.4693086743354797e-05, 2.7958303689956665e-05, 3.122352063655853e-05, 3.44887375831604e-05, 3.775395452976227e-05, 4.1019171476364136e-05, 4.4284388422966003e-05, 4.754960536956787e-05, 5.081482231616974e-05, 5.4080039262771606e-05, 5.7345256209373474e-05, 6.061047315597534e-05, 6.387569010257721e-05, 6.714090704917908e-05, 7.040612399578094e-05, 7.367134094238281e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 17.0, 21.0, 39.0, 60.0, 121.0, 212.0, 454.0, 977.0, 2808.0, 10327.0, 67183.0, 585954.0, 335503.0, 34893.0, 6425.0, 2028.0, 740.0, 377.0, 164.0, 86.0, 67.0, 30.0, 17.0, 20.0, 10.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276611328125, -0.26702117919921875, -0.2574310302734375, -0.24784088134765625, -0.238250732421875, -0.22866058349609375, -0.2190704345703125, -0.20948028564453125, -0.19989013671875, -0.19029998779296875, -0.1807098388671875, -0.17111968994140625, -0.161529541015625, -0.15193939208984375, -0.1423492431640625, -0.13275909423828125, -0.1231689453125, -0.11357879638671875, -0.1039886474609375, -0.09439849853515625, -0.084808349609375, -0.07521820068359375, -0.0656280517578125, -0.05603790283203125, -0.04644775390625, -0.03685760498046875, -0.0272674560546875, -0.01767730712890625, -0.008087158203125, 0.00150299072265625, 0.0110931396484375, 0.02068328857421875, 0.0302734375, 0.03986358642578125, 0.0494537353515625, 0.05904388427734375, 0.068634033203125, 0.07822418212890625, 0.0878143310546875, 0.09740447998046875, 0.10699462890625, 0.11658477783203125, 0.1261749267578125, 0.13576507568359375, 0.145355224609375, 0.15494537353515625, 0.1645355224609375, 0.17412567138671875, 0.1837158203125, 0.19330596923828125, 0.2028961181640625, 0.21248626708984375, 0.222076416015625, 0.23166656494140625, 0.2412567138671875, 0.25084686279296875, 0.26043701171875, 0.27002716064453125, 0.2796173095703125, 0.28920745849609375, 0.298797607421875, 0.30838775634765625, 0.3179779052734375, 0.32756805419921875, 0.337158203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 12.0, 14.0, 38.0, 37.0, 32.0, 50.0, 58.0, 54.0, 65.0, 72.0, 79.0, 78.0, 62.0, 47.0, 42.0, 38.0, 37.0, 40.0, 22.0, 19.0, 19.0, 9.0, 7.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.13773155212402344, -0.13288497924804688, -0.1280384063720703, -0.12319183349609375, -0.11834526062011719, -0.11349868774414062, -0.10865211486816406, -0.1038055419921875, -0.09895896911621094, -0.09411239624023438, -0.08926582336425781, -0.08441925048828125, -0.07957267761230469, -0.07472610473632812, -0.06987953186035156, -0.065032958984375, -0.06018638610839844, -0.055339813232421875, -0.05049324035644531, -0.04564666748046875, -0.04080009460449219, -0.035953521728515625, -0.031106948852539062, -0.0262603759765625, -0.021413803100585938, -0.016567230224609375, -0.011720657348632812, -0.00687408447265625, -0.0020275115966796875, 0.002819061279296875, 0.0076656341552734375, 0.01251220703125, 0.017358779907226562, 0.022205352783203125, 0.027051925659179688, 0.03189849853515625, 0.03674507141113281, 0.041591644287109375, 0.04643821716308594, 0.0512847900390625, 0.05613136291503906, 0.060977935791015625, 0.06582450866699219, 0.07067108154296875, 0.07551765441894531, 0.08036422729492188, 0.08521080017089844, 0.090057373046875, 0.09490394592285156, 0.09975051879882812, 0.10459709167480469, 0.10944366455078125, 0.11429023742675781, 0.11913681030273438, 0.12398338317871094, 0.1288299560546875, 0.13367652893066406, 0.13852310180664062, 0.1433696746826172, 0.14821624755859375, 0.1530628204345703, 0.15790939331054688, 0.16275596618652344, 0.1676025390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 15.0, 34.0, 66.0, 89.0, 147.0, 153.0, 151.0, 114.0, 104.0, 54.0, 33.0, 21.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.354488372802734, -4.259562015533447, -4.164635181427002, -4.069708824157715, -3.9747822284698486, -3.8798556327819824, -3.7849292755126953, -3.690002679824829, -3.595076084136963, -3.5001494884490967, -3.4052228927612305, -3.3102965354919434, -3.215369939804077, -3.120443344116211, -3.025516986846924, -2.9305903911590576, -2.8356637954711914, -2.740737199783325, -2.645810604095459, -2.550884246826172, -2.4559576511383057, -2.3610310554504395, -2.2661046981811523, -2.171178102493286, -2.07625150680542, -1.9813249111175537, -1.886398434638977, -1.7914719581604004, -1.6965453624725342, -1.601618766784668, -1.5066922903060913, -1.4117658138275146, -1.3168392181396484, -1.2219126224517822, -1.1269861459732056, -1.032059669494629, -0.9371330738067627, -0.8422065377235413, -0.7472800016403198, -0.6523534655570984, -0.557426929473877, -0.4625003933906555, -0.3675738573074341, -0.27264732122421265, -0.1777207851409912, -0.08279424905776978, 0.01213228702545166, 0.1070588231086731, 0.20198535919189453, 0.29691189527511597, 0.3918384313583374, 0.48676496744155884, 0.5816915035247803, 0.6766180396080017, 0.7715445756912231, 0.8664711117744446, 0.961397647857666, 1.0563242435455322, 1.1512507200241089, 1.2461771965026855, 1.3411037921905518, 1.436030387878418, 1.5309568643569946, 1.6258833408355713, 1.7208099365234375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 2.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 19.0, 14.0, 16.0, 22.0, 19.0, 34.0, 33.0, 31.0, 42.0, 45.0, 40.0, 37.0, 35.0, 41.0, 49.0, 43.0, 52.0, 45.0, 49.0, 17.0, 42.0, 39.0, 30.0, 23.0, 30.0, 21.0, 14.0, 8.0, 19.0, 11.0, 6.0, 9.0, 1.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.801051139831543, -1.7524038553237915, -1.70375657081604, -1.6551092863082886, -1.606462001800537, -1.5578147172927856, -1.5091674327850342, -1.4605201482772827, -1.4118728637695312, -1.3632255792617798, -1.3145782947540283, -1.2659310102462769, -1.2172837257385254, -1.168636441230774, -1.1199891567230225, -1.071341872215271, -1.0226945877075195, -0.9740473031997681, -0.9254000186920166, -0.8767527341842651, -0.8281054496765137, -0.7794581651687622, -0.7308108806610107, -0.6821635961532593, -0.6335163116455078, -0.5848690271377563, -0.5362217426300049, -0.4875744581222534, -0.43892717361450195, -0.3902798891067505, -0.341632604598999, -0.29298532009124756, -0.2443380355834961, -0.19569075107574463, -0.14704346656799316, -0.0983961820602417, -0.049748897552490234, -0.0011016130447387695, 0.047545671463012695, 0.09619295597076416, 0.14484024047851562, 0.1934875249862671, 0.24213480949401855, 0.29078209400177, 0.3394293785095215, 0.38807666301727295, 0.4367239475250244, 0.4853712320327759, 0.5340185165405273, 0.5826658010482788, 0.6313130855560303, 0.6799603700637817, 0.7286076545715332, 0.7772549390792847, 0.8259022235870361, 0.8745495080947876, 0.9231967926025391, 0.9718440771102905, 1.020491361618042, 1.0691386461257935, 1.117785930633545, 1.1664332151412964, 1.2150804996490479, 1.2637277841567993, 1.3123750686645508]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 15.0, 12.0, 17.0, 26.0, 34.0, 35.0, 58.0, 86.0, 111.0, 175.0, 232.0, 352.0, 514.0, 856.0, 1501.0, 2784.0, 6055.0, 16555.0, 73295.0, 3850210.0, 195044.0, 28645.0, 8953.0, 3733.0, 1930.0, 1070.0, 674.0, 410.0, 274.0, 185.0, 102.0, 84.0, 63.0, 53.0, 25.0, 23.0, 19.0, 13.0, 17.0, 6.0, 10.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.345947265625, -0.3353691101074219, -0.32479095458984375, -0.3142127990722656, -0.3036346435546875, -0.2930564880371094, -0.28247833251953125, -0.2719001770019531, -0.261322021484375, -0.2507438659667969, -0.24016571044921875, -0.22958755493164062, -0.2190093994140625, -0.20843124389648438, -0.19785308837890625, -0.18727493286132812, -0.17669677734375, -0.16611862182617188, -0.15554046630859375, -0.14496231079101562, -0.1343841552734375, -0.12380599975585938, -0.11322784423828125, -0.10264968872070312, -0.092071533203125, -0.08149337768554688, -0.07091522216796875, -0.060337066650390625, -0.0497589111328125, -0.039180755615234375, -0.02860260009765625, -0.018024444580078125, -0.0074462890625, 0.003131866455078125, 0.01371002197265625, 0.024288177490234375, 0.0348663330078125, 0.045444488525390625, 0.05602264404296875, 0.06660079956054688, 0.077178955078125, 0.08775711059570312, 0.09833526611328125, 0.10891342163085938, 0.1194915771484375, 0.13006973266601562, 0.14064788818359375, 0.15122604370117188, 0.16180419921875, 0.17238235473632812, 0.18296051025390625, 0.19353866577148438, 0.2041168212890625, 0.21469497680664062, 0.22527313232421875, 0.23585128784179688, 0.246429443359375, 0.2570075988769531, 0.26758575439453125, 0.2781639099121094, 0.2887420654296875, 0.2993202209472656, 0.30989837646484375, 0.3204765319824219, 0.3310546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 10.0, 6.0, 12.0, 9.0, 26.0, 17.0, 17.0, 23.0, 33.0, 26.0, 27.0, 37.0, 38.0, 40.0, 38.0, 47.0, 48.0, 37.0, 35.0, 45.0, 40.0, 43.0, 38.0, 40.0, 34.0, 26.0, 38.0, 25.0, 27.0, 16.0, 15.0, 15.0, 9.0, 10.0, 11.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.056732177734375, -0.05499982833862305, -0.053267478942871094, -0.05153512954711914, -0.04980278015136719, -0.048070430755615234, -0.04633808135986328, -0.04460573196411133, -0.042873382568359375, -0.04114103317260742, -0.03940868377685547, -0.037676334381103516, -0.03594398498535156, -0.03421163558959961, -0.032479286193847656, -0.030746936798095703, -0.02901458740234375, -0.027282238006591797, -0.025549888610839844, -0.02381753921508789, -0.022085189819335938, -0.020352840423583984, -0.01862049102783203, -0.016888141632080078, -0.015155792236328125, -0.013423442840576172, -0.011691093444824219, -0.009958744049072266, -0.008226394653320312, -0.006494045257568359, -0.004761695861816406, -0.003029346466064453, -0.0012969970703125, 0.0004353523254394531, 0.0021677017211914062, 0.0039000511169433594, 0.0056324005126953125, 0.007364749908447266, 0.009097099304199219, 0.010829448699951172, 0.012561798095703125, 0.014294147491455078, 0.01602649688720703, 0.017758846282958984, 0.019491195678710938, 0.02122354507446289, 0.022955894470214844, 0.024688243865966797, 0.02642059326171875, 0.028152942657470703, 0.029885292053222656, 0.03161764144897461, 0.03334999084472656, 0.035082340240478516, 0.03681468963623047, 0.03854703903198242, 0.040279388427734375, 0.04201173782348633, 0.04374408721923828, 0.045476436614990234, 0.04720878601074219, 0.04894113540649414, 0.050673484802246094, 0.05240583419799805, 0.05413818359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 7.0, 7.0, 7.0, 15.0, 9.0, 11.0, 22.0, 25.0, 14.0, 39.0, 39.0, 69.0, 68.0, 101.0, 112.0, 147.0, 209.0, 299.0, 476.0, 907.0, 2626.0, 14169.0, 3333964.0, 822629.0, 13377.0, 2454.0, 876.0, 481.0, 274.0, 205.0, 127.0, 103.0, 97.0, 74.0, 54.0, 42.0, 34.0, 32.0, 20.0, 14.0, 10.0, 16.0, 5.0, 5.0, 0.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1361846923828125, -1.099517822265625, -1.0628509521484375, -1.02618408203125, -0.9895172119140625, -0.952850341796875, -0.9161834716796875, -0.8795166015625, -0.8428497314453125, -0.806182861328125, -0.7695159912109375, -0.73284912109375, -0.6961822509765625, -0.659515380859375, -0.6228485107421875, -0.586181640625, -0.5495147705078125, -0.512847900390625, -0.4761810302734375, -0.43951416015625, -0.4028472900390625, -0.366180419921875, -0.3295135498046875, -0.2928466796875, -0.2561798095703125, -0.219512939453125, -0.1828460693359375, -0.14617919921875, -0.1095123291015625, -0.072845458984375, -0.0361785888671875, 0.00048828125, 0.0371551513671875, 0.073822021484375, 0.1104888916015625, 0.14715576171875, 0.1838226318359375, 0.220489501953125, 0.2571563720703125, 0.2938232421875, 0.3304901123046875, 0.367156982421875, 0.4038238525390625, 0.44049072265625, 0.4771575927734375, 0.513824462890625, 0.5504913330078125, 0.587158203125, 0.6238250732421875, 0.660491943359375, 0.6971588134765625, 0.73382568359375, 0.7704925537109375, 0.807159423828125, 0.8438262939453125, 0.8804931640625, 0.9171600341796875, 0.953826904296875, 0.9904937744140625, 1.02716064453125, 1.0638275146484375, 1.100494384765625, 1.1371612548828125, 1.173828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 18.0, 55.0, 145.0, 3531.0, 215.0, 75.0, 14.0, 7.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.31607818603515625, -0.3072052001953125, -0.29833221435546875, -0.289459228515625, -0.28058624267578125, -0.2717132568359375, -0.26284027099609375, -0.25396728515625, -0.24509429931640625, -0.2362213134765625, -0.22734832763671875, -0.218475341796875, -0.20960235595703125, -0.2007293701171875, -0.19185638427734375, -0.1829833984375, -0.17411041259765625, -0.1652374267578125, -0.15636444091796875, -0.147491455078125, -0.13861846923828125, -0.1297454833984375, -0.12087249755859375, -0.11199951171875, -0.10312652587890625, -0.0942535400390625, -0.08538055419921875, -0.076507568359375, -0.06763458251953125, -0.0587615966796875, -0.04988861083984375, -0.041015625, -0.03214263916015625, -0.0232696533203125, -0.01439666748046875, -0.005523681640625, 0.00334930419921875, 0.0122222900390625, 0.02109527587890625, 0.02996826171875, 0.03884124755859375, 0.0477142333984375, 0.05658721923828125, 0.065460205078125, 0.07433319091796875, 0.0832061767578125, 0.09207916259765625, 0.1009521484375, 0.10982513427734375, 0.1186981201171875, 0.12757110595703125, 0.136444091796875, 0.14531707763671875, 0.1541900634765625, 0.16306304931640625, 0.17193603515625, 0.18080902099609375, 0.1896820068359375, 0.19855499267578125, 0.207427978515625, 0.21630096435546875, 0.2251739501953125, 0.23404693603515625, 0.242919921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 14.0, 11.0, 15.0, 12.0, 30.0, 32.0, 27.0, 41.0, 60.0, 49.0, 55.0, 60.0, 73.0, 84.0, 72.0, 81.0, 59.0, 51.0, 44.0, 38.0, 21.0, 14.0, 15.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4650503396987915, -0.45184797048568726, -0.438645601272583, -0.42544323205947876, -0.4122408628463745, -0.39903849363327026, -0.385836124420166, -0.37263375520706177, -0.3594313859939575, -0.34622901678085327, -0.333026647567749, -0.3198242783546448, -0.3066219091415405, -0.2934195399284363, -0.28021717071533203, -0.2670148015022278, -0.2538124620914459, -0.24061009287834167, -0.22740772366523743, -0.21420535445213318, -0.20100298523902893, -0.18780061602592468, -0.17459826171398163, -0.16139589250087738, -0.14819352328777313, -0.13499115407466888, -0.12178878486156464, -0.10858642309904099, -0.09538405388593674, -0.08218168467283249, -0.06897932291030884, -0.05577695369720459, -0.04257461428642273, -0.02937224693596363, -0.016169879585504532, -0.0029675140976905823, 0.010234855115413666, 0.023437224328517914, 0.036639586091041565, 0.04984195530414581, 0.06304432451725006, 0.07624669373035431, 0.08944906294345856, 0.10265142470598221, 0.11585379391908646, 0.1290561556816101, 0.14225852489471436, 0.1554608941078186, 0.16866326332092285, 0.1818656325340271, 0.19506800174713135, 0.2082703709602356, 0.22147274017333984, 0.2346751093864441, 0.24787746369838715, 0.2610798478126526, 0.27428221702575684, 0.2874845862388611, 0.30068695545196533, 0.3138893246650696, 0.32709169387817383, 0.3402940630912781, 0.3534964323043823, 0.3666988015174866, 0.37990114092826843]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 17.0, 17.0, 17.0, 28.0, 13.0, 26.0, 29.0, 22.0, 41.0, 22.0, 43.0, 35.0, 28.0, 37.0, 52.0, 49.0, 31.0, 45.0, 36.0, 33.0, 27.0, 28.0, 36.0, 28.0, 31.0, 30.0, 23.0, 21.0, 21.0, 18.0, 13.0, 14.0, 11.0, 5.0, 10.0, 5.0, 1.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.28381919860839844, -0.27472493052482605, -0.2656306326389313, -0.2565363645553589, -0.2474420815706253, -0.23834779858589172, -0.22925351560115814, -0.22015923261642456, -0.21106496453285217, -0.2019706815481186, -0.192876398563385, -0.18378213047981262, -0.17468784749507904, -0.16559356451034546, -0.15649928152561188, -0.1474049985408783, -0.13831071555614471, -0.12921643257141113, -0.12012215703725815, -0.11102787405252457, -0.10193359851837158, -0.092839315533638, -0.08374503254890442, -0.07465075701475143, -0.06555647403001785, -0.05646219477057457, -0.04736791551113129, -0.038273632526397705, -0.029179353266954422, -0.02008507400751114, -0.010990791022777557, -0.0018965154886245728, 0.007197767496109009, 0.016292046755552292, 0.025386327877640724, 0.034480608999729156, 0.04357488825917244, 0.05266916751861572, 0.061763450503349304, 0.07085772603750229, 0.07995200902223587, 0.08904629200696945, 0.09814056754112244, 0.10723485052585602, 0.1163291335105896, 0.125423401594162, 0.13451769948005676, 0.14361196756362915, 0.15270625054836273, 0.1618005335330963, 0.1708948165178299, 0.17998909950256348, 0.18908336758613586, 0.19817765057086945, 0.20727193355560303, 0.21636620163917542, 0.2254604995250702, 0.23455478250980377, 0.24364906549453735, 0.25274333357810974, 0.2618376314640045, 0.2709318995475769, 0.2800261974334717, 0.28912046551704407, 0.29821473360061646]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 10.0, 23.0, 29.0, 38.0, 55.0, 90.0, 120.0, 190.0, 280.0, 428.0, 767.0, 1364.0, 2317.0, 4051.0, 7461.0, 14587.0, 28149.0, 53559.0, 100001.0, 169833.0, 220350.0, 189426.0, 118408.0, 64776.0, 33957.0, 17533.0, 9174.0, 4849.0, 2663.0, 1553.0, 900.0, 522.0, 317.0, 219.0, 145.0, 117.0, 65.0, 54.0, 45.0, 25.0, 11.0, 12.0, 15.0, 10.0, 9.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.169677734375, -0.16463470458984375, -0.1595916748046875, -0.15454864501953125, -0.149505615234375, -0.14446258544921875, -0.1394195556640625, -0.13437652587890625, -0.12933349609375, -0.12429046630859375, -0.1192474365234375, -0.11420440673828125, -0.109161376953125, -0.10411834716796875, -0.0990753173828125, -0.09403228759765625, -0.0889892578125, -0.08394622802734375, -0.0789031982421875, -0.07386016845703125, -0.068817138671875, -0.06377410888671875, -0.0587310791015625, -0.05368804931640625, -0.04864501953125, -0.04360198974609375, -0.0385589599609375, -0.03351593017578125, -0.028472900390625, -0.02342987060546875, -0.0183868408203125, -0.01334381103515625, -0.00830078125, -0.00325775146484375, 0.0017852783203125, 0.00682830810546875, 0.011871337890625, 0.01691436767578125, 0.0219573974609375, 0.02700042724609375, 0.03204345703125, 0.03708648681640625, 0.0421295166015625, 0.04717254638671875, 0.052215576171875, 0.05725860595703125, 0.0623016357421875, 0.06734466552734375, 0.0723876953125, 0.07743072509765625, 0.0824737548828125, 0.08751678466796875, 0.092559814453125, 0.09760284423828125, 0.1026458740234375, 0.10768890380859375, 0.11273193359375, 0.11777496337890625, 0.1228179931640625, 0.12786102294921875, 0.132904052734375, 0.13794708251953125, 0.1429901123046875, 0.14803314208984375, 0.153076171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 4.0, 17.0, 14.0, 17.0, 20.0, 32.0, 30.0, 18.0, 18.0, 30.0, 29.0, 42.0, 30.0, 33.0, 38.0, 41.0, 39.0, 40.0, 29.0, 35.0, 37.0, 45.0, 43.0, 39.0, 37.0, 35.0, 18.0, 20.0, 20.0, 19.0, 13.0, 10.0, 8.0, 10.0, 14.0, 11.0, 7.0, 5.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0], "bins": [-0.0733642578125, -0.07134199142456055, -0.0693197250366211, -0.06729745864868164, -0.06527519226074219, -0.06325292587280273, -0.06123065948486328, -0.05920839309692383, -0.057186126708984375, -0.05516386032104492, -0.05314159393310547, -0.051119327545166016, -0.04909706115722656, -0.04707479476928711, -0.045052528381347656, -0.0430302619934082, -0.04100799560546875, -0.0389857292175293, -0.036963462829589844, -0.03494119644165039, -0.03291893005371094, -0.030896663665771484, -0.02887439727783203, -0.026852130889892578, -0.024829864501953125, -0.022807598114013672, -0.02078533172607422, -0.018763065338134766, -0.016740798950195312, -0.01471853256225586, -0.012696266174316406, -0.010673999786376953, -0.0086517333984375, -0.006629467010498047, -0.004607200622558594, -0.0025849342346191406, -0.0005626678466796875, 0.0014595985412597656, 0.0034818649291992188, 0.005504131317138672, 0.007526397705078125, 0.009548664093017578, 0.011570930480957031, 0.013593196868896484, 0.015615463256835938, 0.01763772964477539, 0.019659996032714844, 0.021682262420654297, 0.02370452880859375, 0.025726795196533203, 0.027749061584472656, 0.02977132797241211, 0.03179359436035156, 0.033815860748291016, 0.03583812713623047, 0.03786039352416992, 0.039882659912109375, 0.04190492630004883, 0.04392719268798828, 0.045949459075927734, 0.04797172546386719, 0.04999399185180664, 0.052016258239746094, 0.05403852462768555, 0.056060791015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 14.0, 10.0, 23.0, 16.0, 22.0, 37.0, 61.0, 81.0, 99.0, 170.0, 255.0, 334.0, 541.0, 926.0, 1659.0, 3547.0, 10626.0, 46415.0, 263549.0, 559475.0, 124649.0, 23907.0, 6330.0, 2476.0, 1233.0, 692.0, 458.0, 286.0, 205.0, 121.0, 86.0, 77.0, 51.0, 34.0, 22.0, 17.0, 11.0, 8.0, 10.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4501953125, -0.4362525939941406, -0.42230987548828125, -0.4083671569824219, -0.3944244384765625, -0.3804817199707031, -0.36653900146484375, -0.3525962829589844, -0.338653564453125, -0.3247108459472656, -0.31076812744140625, -0.2968254089355469, -0.2828826904296875, -0.2689399719238281, -0.25499725341796875, -0.24105453491210938, -0.22711181640625, -0.21316909790039062, -0.19922637939453125, -0.18528366088867188, -0.1713409423828125, -0.15739822387695312, -0.14345550537109375, -0.12951278686523438, -0.115570068359375, -0.10162734985351562, -0.08768463134765625, -0.07374191284179688, -0.0597991943359375, -0.045856475830078125, -0.03191375732421875, -0.017971038818359375, -0.0040283203125, 0.009914398193359375, 0.02385711669921875, 0.037799835205078125, 0.0517425537109375, 0.06568527221679688, 0.07962799072265625, 0.09357070922851562, 0.107513427734375, 0.12145614624023438, 0.13539886474609375, 0.14934158325195312, 0.1632843017578125, 0.17722702026367188, 0.19116973876953125, 0.20511245727539062, 0.21905517578125, 0.23299789428710938, 0.24694061279296875, 0.2608833312988281, 0.2748260498046875, 0.2887687683105469, 0.30271148681640625, 0.3166542053222656, 0.330596923828125, 0.3445396423339844, 0.35848236083984375, 0.3724250793457031, 0.3863677978515625, 0.4003105163574219, 0.41425323486328125, 0.4281959533691406, 0.442138671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 13.0, 9.0, 16.0, 11.0, 21.0, 19.0, 27.0, 19.0, 24.0, 33.0, 25.0, 40.0, 40.0, 44.0, 42.0, 45.0, 46.0, 41.0, 43.0, 44.0, 46.0, 33.0, 47.0, 32.0, 31.0, 34.0, 25.0, 22.0, 24.0, 17.0, 13.0, 9.0, 15.0, 12.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4150390625, -0.40302276611328125, -0.3910064697265625, -0.37899017333984375, -0.366973876953125, -0.35495758056640625, -0.3429412841796875, -0.33092498779296875, -0.31890869140625, -0.30689239501953125, -0.2948760986328125, -0.28285980224609375, -0.270843505859375, -0.25882720947265625, -0.2468109130859375, -0.23479461669921875, -0.2227783203125, -0.21076202392578125, -0.1987457275390625, -0.18672943115234375, -0.174713134765625, -0.16269683837890625, -0.1506805419921875, -0.13866424560546875, -0.12664794921875, -0.11463165283203125, -0.1026153564453125, -0.09059906005859375, -0.078582763671875, -0.06656646728515625, -0.0545501708984375, -0.04253387451171875, -0.030517578125, -0.01850128173828125, -0.0064849853515625, 0.00553131103515625, 0.017547607421875, 0.02956390380859375, 0.0415802001953125, 0.05359649658203125, 0.06561279296875, 0.07762908935546875, 0.0896453857421875, 0.10166168212890625, 0.113677978515625, 0.12569427490234375, 0.1377105712890625, 0.14972686767578125, 0.1617431640625, 0.17375946044921875, 0.1857757568359375, 0.19779205322265625, 0.209808349609375, 0.22182464599609375, 0.2338409423828125, 0.24585723876953125, 0.25787353515625, 0.26988983154296875, 0.2819061279296875, 0.29392242431640625, 0.305938720703125, 0.31795501708984375, 0.3299713134765625, 0.34198760986328125, 0.35400390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 16.0, 16.0, 40.0, 79.0, 129.0, 262.0, 596.0, 1731.0, 6582.0, 45207.0, 715720.0, 254011.0, 18593.0, 3598.0, 1086.0, 406.0, 213.0, 109.0, 58.0, 30.0, 21.0, 11.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5953903198242188, -0.5804290771484375, -0.5654678344726562, -0.550506591796875, -0.5355453491210938, -0.5205841064453125, -0.5056228637695312, -0.49066162109375, -0.47570037841796875, -0.4607391357421875, -0.44577789306640625, -0.430816650390625, -0.41585540771484375, -0.4008941650390625, -0.38593292236328125, -0.3709716796875, -0.35601043701171875, -0.3410491943359375, -0.32608795166015625, -0.311126708984375, -0.29616546630859375, -0.2812042236328125, -0.26624298095703125, -0.25128173828125, -0.23632049560546875, -0.2213592529296875, -0.20639801025390625, -0.191436767578125, -0.17647552490234375, -0.1615142822265625, -0.14655303955078125, -0.131591796875, -0.11663055419921875, -0.1016693115234375, -0.08670806884765625, -0.071746826171875, -0.05678558349609375, -0.0418243408203125, -0.02686309814453125, -0.01190185546875, 0.00305938720703125, 0.0180206298828125, 0.03298187255859375, 0.047943115234375, 0.06290435791015625, 0.0778656005859375, 0.09282684326171875, 0.1077880859375, 0.12274932861328125, 0.1377105712890625, 0.15267181396484375, 0.167633056640625, 0.18259429931640625, 0.1975555419921875, 0.21251678466796875, 0.22747802734375, 0.24243927001953125, 0.2574005126953125, 0.27236175537109375, 0.287322998046875, 0.30228424072265625, 0.3172454833984375, 0.33220672607421875, 0.34716796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 11.0, 12.0, 30.0, 27.0, 35.0, 45.0, 68.0, 65.0, 58.0, 95.0, 106.0, 79.0, 76.0, 68.0, 49.0, 45.0, 38.0, 27.0, 19.0, 10.0, 16.0, 7.0, 6.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012576580047607422, -0.00012165307998657227, -0.00011754035949707031, -0.00011342763900756836, -0.0001093149185180664, -0.00010520219802856445, -0.0001010894775390625, -9.697675704956055e-05, -9.28640365600586e-05, -8.875131607055664e-05, -8.463859558105469e-05, -8.052587509155273e-05, -7.641315460205078e-05, -7.230043411254883e-05, -6.818771362304688e-05, -6.407499313354492e-05, -5.996227264404297e-05, -5.5849552154541016e-05, -5.173683166503906e-05, -4.762411117553711e-05, -4.3511390686035156e-05, -3.93986701965332e-05, -3.528594970703125e-05, -3.11732292175293e-05, -2.7060508728027344e-05, -2.294778823852539e-05, -1.8835067749023438e-05, -1.4722347259521484e-05, -1.0609626770019531e-05, -6.496906280517578e-06, -2.384185791015625e-06, 1.7285346984863281e-06, 5.841255187988281e-06, 9.953975677490234e-06, 1.4066696166992188e-05, 1.817941665649414e-05, 2.2292137145996094e-05, 2.6404857635498047e-05, 3.0517578125e-05, 3.463029861450195e-05, 3.8743019104003906e-05, 4.285573959350586e-05, 4.696846008300781e-05, 5.1081180572509766e-05, 5.519390106201172e-05, 5.930662155151367e-05, 6.341934204101562e-05, 6.753206253051758e-05, 7.164478302001953e-05, 7.575750350952148e-05, 7.987022399902344e-05, 8.398294448852539e-05, 8.809566497802734e-05, 9.22083854675293e-05, 9.632110595703125e-05, 0.0001004338264465332, 0.00010454654693603516, 0.00010865926742553711, 0.00011277198791503906, 0.00011688470840454102, 0.00012099742889404297, 0.00012511014938354492, 0.00012922286987304688, 0.00013333559036254883, 0.00013744831085205078]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 9.0, 17.0, 28.0, 41.0, 55.0, 97.0, 128.0, 232.0, 459.0, 852.0, 2045.0, 5383.0, 18964.0, 121191.0, 683998.0, 179083.0, 24665.0, 6528.0, 2471.0, 1014.0, 518.0, 277.0, 153.0, 99.0, 84.0, 35.0, 32.0, 16.0, 10.0, 8.0, 9.0, 4.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30615234375, -0.296142578125, -0.2861328125, -0.276123046875, -0.26611328125, -0.256103515625, -0.24609375, -0.236083984375, -0.22607421875, -0.216064453125, -0.2060546875, -0.196044921875, -0.18603515625, -0.176025390625, -0.166015625, -0.156005859375, -0.14599609375, -0.135986328125, -0.1259765625, -0.115966796875, -0.10595703125, -0.095947265625, -0.0859375, -0.075927734375, -0.06591796875, -0.055908203125, -0.0458984375, -0.035888671875, -0.02587890625, -0.015869140625, -0.005859375, 0.004150390625, 0.01416015625, 0.024169921875, 0.0341796875, 0.044189453125, 0.05419921875, 0.064208984375, 0.07421875, 0.084228515625, 0.09423828125, 0.104248046875, 0.1142578125, 0.124267578125, 0.13427734375, 0.144287109375, 0.154296875, 0.164306640625, 0.17431640625, 0.184326171875, 0.1943359375, 0.204345703125, 0.21435546875, 0.224365234375, 0.234375, 0.244384765625, 0.25439453125, 0.264404296875, 0.2744140625, 0.284423828125, 0.29443359375, 0.304443359375, 0.314453125, 0.324462890625, 0.33447265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 10.0, 6.0, 17.0, 25.0, 40.0, 69.0, 78.0, 90.0, 119.0, 116.0, 109.0, 103.0, 60.0, 45.0, 24.0, 30.0, 11.0, 11.0, 5.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2083740234375, -0.1985607147216797, -0.18874740600585938, -0.17893409729003906, -0.16912078857421875, -0.15930747985839844, -0.14949417114257812, -0.1396808624267578, -0.1298675537109375, -0.12005424499511719, -0.11024093627929688, -0.10042762756347656, -0.09061431884765625, -0.08080101013183594, -0.07098770141601562, -0.06117439270019531, -0.051361083984375, -0.04154777526855469, -0.031734466552734375, -0.021921157836914062, -0.01210784912109375, -0.0022945404052734375, 0.007518768310546875, 0.017332077026367188, 0.0271453857421875, 0.03695869445800781, 0.046772003173828125, 0.05658531188964844, 0.06639862060546875, 0.07621192932128906, 0.08602523803710938, 0.09583854675292969, 0.10565185546875, 0.11546516418457031, 0.12527847290039062, 0.13509178161621094, 0.14490509033203125, 0.15471839904785156, 0.16453170776367188, 0.1743450164794922, 0.1841583251953125, 0.1939716339111328, 0.20378494262695312, 0.21359825134277344, 0.22341156005859375, 0.23322486877441406, 0.24303817749023438, 0.2528514862060547, 0.262664794921875, 0.2724781036376953, 0.2822914123535156, 0.29210472106933594, 0.30191802978515625, 0.31173133850097656, 0.3215446472167969, 0.3313579559326172, 0.3411712646484375, 0.3509845733642578, 0.3607978820800781, 0.37061119079589844, 0.38042449951171875, 0.39023780822753906, 0.4000511169433594, 0.4098644256591797, 0.419677734375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 20.0, 17.0, 38.0, 42.0, 82.0, 110.0, 156.0, 132.0, 110.0, 107.0, 74.0, 50.0, 26.0, 14.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134925603866577, -3.011815071105957, -2.888704299926758, -2.7655935287475586, -2.6424829959869385, -2.5193724632263184, -2.396261692047119, -2.27315092086792, -2.1500403881073, -2.0269298553466797, -1.9038190841674805, -1.7807084321975708, -1.6575977802276611, -1.5344871282577515, -1.4113764762878418, -1.2882658243179321, -1.1651551723480225, -1.0420445203781128, -0.9189338684082031, -0.7958232164382935, -0.6727125644683838, -0.5496019124984741, -0.42649126052856445, -0.3033806085586548, -0.18026995658874512, -0.05715930461883545, 0.06595134735107422, 0.1890619993209839, 0.31217265129089355, 0.4352833032608032, 0.5583939552307129, 0.6815046072006226, 0.8046150207519531, 0.9277256727218628, 1.0508363246917725, 1.1739469766616821, 1.2970576286315918, 1.4201682806015015, 1.5432789325714111, 1.6663895845413208, 1.7895002365112305, 1.9126108884811401, 2.03572154045105, 2.15883207321167, 2.281942844390869, 2.4050536155700684, 2.5281641483306885, 2.6512746810913086, 2.774385452270508, 2.897496223449707, 3.020606756210327, 3.1437172889709473, 3.2668280601501465, 3.3899388313293457, 3.513049364089966, 3.636159896850586, 3.759270668029785, 3.8823814392089844, 4.005492210388184, 4.128602504730225, 4.251713275909424, 4.374824047088623, 4.497934341430664, 4.621045112609863, 4.7441558837890625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 13.0, 6.0, 11.0, 18.0, 14.0, 26.0, 18.0, 27.0, 27.0, 28.0, 23.0, 44.0, 49.0, 30.0, 41.0, 46.0, 48.0, 56.0, 47.0, 42.0, 38.0, 33.0, 33.0, 24.0, 39.0, 24.0, 29.0, 27.0, 21.0, 21.0, 12.0, 11.0, 9.0, 10.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.234001636505127, -2.169093370437622, -2.104184865951538, -2.039276599884033, -1.9743683338165283, -1.9094599485397339, -1.8445515632629395, -1.7796432971954346, -1.7147350311279297, -1.6498266458511353, -1.5849183797836304, -1.520009994506836, -1.455101728439331, -1.3901933431625366, -1.3252849578857422, -1.2603766918182373, -1.1954683065414429, -1.1305599212646484, -1.0656516551971436, -1.0007432699203491, -0.9358350038528442, -0.8709266185760498, -0.8060182929039001, -0.7411099672317505, -0.6762016415596008, -0.6112933158874512, -0.5463849902153015, -0.48147663474082947, -0.4165683090686798, -0.35165998339653015, -0.2867516279220581, -0.22184330224990845, -0.1569349765777588, -0.09202664345502853, -0.02711831033229828, 0.03779003024101257, 0.10269835591316223, 0.1676066815853119, 0.23251503705978394, 0.2974233627319336, 0.36233168840408325, 0.4272400140762329, 0.49214833974838257, 0.5570566654205322, 0.6219650506973267, 0.6868733167648315, 0.751781702041626, 0.8166900277137756, 0.8815983533859253, 0.946506679058075, 1.0114150047302246, 1.076323390007019, 1.141231656074524, 1.2061400413513184, 1.2710483074188232, 1.3359566926956177, 1.400865077972412, 1.4657734632492065, 1.5306817293167114, 1.5955901145935059, 1.6604983806610107, 1.7254067659378052, 1.7903151512145996, 1.8552234172821045, 1.9201316833496094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 8.0, 8.0, 5.0, 22.0, 39.0, 51.0, 87.0, 171.0, 435.0, 1005.0, 2822.0, 10909.0, 143555.0, 4002162.0, 25521.0, 4897.0, 1538.0, 539.0, 245.0, 112.0, 59.0, 30.0, 22.0, 10.0, 11.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.798828125, -0.771484375, -0.744140625, -0.716796875, -0.689453125, -0.662109375, -0.634765625, -0.607421875, -0.580078125, -0.552734375, -0.525390625, -0.498046875, -0.470703125, -0.443359375, -0.416015625, -0.388671875, -0.361328125, -0.333984375, -0.306640625, -0.279296875, -0.251953125, -0.224609375, -0.197265625, -0.169921875, -0.142578125, -0.115234375, -0.087890625, -0.060546875, -0.033203125, -0.005859375, 0.021484375, 0.048828125, 0.076171875, 0.103515625, 0.130859375, 0.158203125, 0.185546875, 0.212890625, 0.240234375, 0.267578125, 0.294921875, 0.322265625, 0.349609375, 0.376953125, 0.404296875, 0.431640625, 0.458984375, 0.486328125, 0.513671875, 0.541015625, 0.568359375, 0.595703125, 0.623046875, 0.650390625, 0.677734375, 0.705078125, 0.732421875, 0.759765625, 0.787109375, 0.814453125, 0.841796875, 0.869140625, 0.896484375, 0.923828125, 0.951171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 9.0, 4.0, 8.0, 4.0, 10.0, 10.0, 20.0, 24.0, 23.0, 25.0, 33.0, 47.0, 38.0, 46.0, 48.0, 54.0, 50.0, 55.0, 56.0, 56.0, 53.0, 46.0, 43.0, 41.0, 32.0, 29.0, 29.0, 16.0, 18.0, 15.0, 12.0, 13.0, 8.0, 9.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09398174285888672, -0.09128379821777344, -0.08858585357666016, -0.08588790893554688, -0.0831899642944336, -0.08049201965332031, -0.07779407501220703, -0.07509613037109375, -0.07239818572998047, -0.06970024108886719, -0.0670022964477539, -0.06430435180664062, -0.061606407165527344, -0.05890846252441406, -0.05621051788330078, -0.0535125732421875, -0.05081462860107422, -0.04811668395996094, -0.045418739318847656, -0.042720794677734375, -0.040022850036621094, -0.03732490539550781, -0.03462696075439453, -0.03192901611328125, -0.02923107147216797, -0.026533126831054688, -0.023835182189941406, -0.021137237548828125, -0.018439292907714844, -0.015741348266601562, -0.013043403625488281, -0.010345458984375, -0.007647514343261719, -0.0049495697021484375, -0.0022516250610351562, 0.000446319580078125, 0.0031442642211914062, 0.0058422088623046875, 0.008540153503417969, 0.01123809814453125, 0.013936042785644531, 0.016633987426757812, 0.019331932067871094, 0.022029876708984375, 0.024727821350097656, 0.027425765991210938, 0.03012371063232422, 0.0328216552734375, 0.03551959991455078, 0.03821754455566406, 0.040915489196777344, 0.043613433837890625, 0.046311378479003906, 0.04900932312011719, 0.05170726776123047, 0.05440521240234375, 0.05710315704345703, 0.05980110168457031, 0.062499046325683594, 0.06519699096679688, 0.06789493560791016, 0.07059288024902344, 0.07329082489013672, 0.07598876953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 12.0, 14.0, 24.0, 30.0, 43.0, 89.0, 135.0, 214.0, 482.0, 1041.0, 2784.0, 9438.0, 64253.0, 4044680.0, 57224.0, 9078.0, 2623.0, 1007.0, 490.0, 208.0, 119.0, 70.0, 43.0, 31.0, 26.0, 16.0, 13.0, 17.0, 3.0, 10.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.4541015625, -1.4163131713867188, -1.3785247802734375, -1.3407363891601562, -1.302947998046875, -1.2651596069335938, -1.2273712158203125, -1.1895828247070312, -1.15179443359375, -1.1140060424804688, -1.0762176513671875, -1.0384292602539062, -1.000640869140625, -0.9628524780273438, -0.9250640869140625, -0.8872756958007812, -0.8494873046875, -0.8116989135742188, -0.7739105224609375, -0.7361221313476562, -0.698333740234375, -0.6605453491210938, -0.6227569580078125, -0.5849685668945312, -0.54718017578125, -0.5093917846679688, -0.4716033935546875, -0.43381500244140625, -0.396026611328125, -0.35823822021484375, -0.3204498291015625, -0.28266143798828125, -0.244873046875, -0.20708465576171875, -0.1692962646484375, -0.13150787353515625, -0.093719482421875, -0.05593109130859375, -0.0181427001953125, 0.01964569091796875, 0.05743408203125, 0.09522247314453125, 0.1330108642578125, 0.17079925537109375, 0.208587646484375, 0.24637603759765625, 0.2841644287109375, 0.32195281982421875, 0.3597412109375, 0.39752960205078125, 0.4353179931640625, 0.47310638427734375, 0.510894775390625, 0.5486831665039062, 0.5864715576171875, 0.6242599487304688, 0.66204833984375, 0.6998367309570312, 0.7376251220703125, 0.7754135131835938, 0.813201904296875, 0.8509902954101562, 0.8887786865234375, 0.9265670776367188, 0.96435546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 18.0, 15.0, 23.0, 74.0, 235.0, 3250.0, 300.0, 63.0, 24.0, 30.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.36962890625, -0.3613319396972656, -0.35303497314453125, -0.3447380065917969, -0.3364410400390625, -0.3281440734863281, -0.31984710693359375, -0.3115501403808594, -0.303253173828125, -0.2949562072753906, -0.28665924072265625, -0.2783622741699219, -0.2700653076171875, -0.2617683410644531, -0.25347137451171875, -0.24517440795898438, -0.23687744140625, -0.22858047485351562, -0.22028350830078125, -0.21198654174804688, -0.2036895751953125, -0.19539260864257812, -0.18709564208984375, -0.17879867553710938, -0.170501708984375, -0.16220474243164062, -0.15390777587890625, -0.14561080932617188, -0.1373138427734375, -0.12901687622070312, -0.12071990966796875, -0.11242294311523438, -0.1041259765625, -0.09582901000976562, -0.08753204345703125, -0.07923507690429688, -0.0709381103515625, -0.06264114379882812, -0.05434417724609375, -0.046047210693359375, -0.037750244140625, -0.029453277587890625, -0.02115631103515625, -0.012859344482421875, -0.0045623779296875, 0.003734588623046875, 0.01203155517578125, 0.020328521728515625, 0.02862548828125, 0.036922454833984375, 0.04521942138671875, 0.053516387939453125, 0.0618133544921875, 0.07011032104492188, 0.07840728759765625, 0.08670425415039062, 0.095001220703125, 0.10329818725585938, 0.11159515380859375, 0.11989212036132812, 0.1281890869140625, 0.13648605346679688, 0.14478302001953125, 0.15307998657226562, 0.161376953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 10.0, 26.0, 25.0, 26.0, 37.0, 45.0, 60.0, 59.0, 75.0, 56.0, 76.0, 79.0, 66.0, 76.0, 55.0, 41.0, 30.0, 35.0, 27.0, 21.0, 24.0, 18.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5710350275039673, -0.5541232228279114, -0.5372114181518555, -0.5202996730804443, -0.5033878684043884, -0.4864760637283325, -0.469564288854599, -0.4526525139808655, -0.43574070930480957, -0.41882890462875366, -0.40191712975502014, -0.3850053548812866, -0.3680935502052307, -0.3511817455291748, -0.3342699706554413, -0.31735819578170776, -0.30044639110565186, -0.28353458642959595, -0.2666228115558624, -0.2497110217809677, -0.232799232006073, -0.21588744223117828, -0.19897565245628357, -0.18206386268138885, -0.16515207290649414, -0.14824028313159943, -0.1313284933567047, -0.11441670358181, -0.09750491380691528, -0.08059312403202057, -0.06368133425712585, -0.04676954448223114, -0.0298578143119812, -0.012946024537086487, 0.0039657652378082275, 0.020877555012702942, 0.037789344787597656, 0.05470113456249237, 0.07161292433738708, 0.0885247141122818, 0.10543650388717651, 0.12234829366207123, 0.13926008343696594, 0.15617187321186066, 0.17308366298675537, 0.18999545276165009, 0.2069072425365448, 0.22381903231143951, 0.24073082208633423, 0.25764262676239014, 0.27455440163612366, 0.2914661765098572, 0.3083779811859131, 0.325289785861969, 0.3422015607357025, 0.35911333560943604, 0.37602514028549194, 0.39293694496154785, 0.40984871983528137, 0.4267604947090149, 0.4436722993850708, 0.4605841040611267, 0.47749587893486023, 0.49440765380859375, 0.5113194584846497]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 4.0, 4.0, 1.0, 6.0, 4.0, 4.0, 8.0, 9.0, 3.0, 9.0, 10.0, 11.0, 18.0, 15.0, 17.0, 23.0, 29.0, 23.0, 29.0, 24.0, 34.0, 27.0, 44.0, 32.0, 37.0, 43.0, 43.0, 43.0, 39.0, 55.0, 41.0, 36.0, 25.0, 19.0, 22.0, 28.0, 26.0, 29.0, 26.0, 25.0, 16.0, 10.0, 11.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3184284567832947, -0.3076654076576233, -0.2969023287296295, -0.28613927960395813, -0.27537623047828674, -0.26461315155029297, -0.2538501024246216, -0.243087038397789, -0.23232397437095642, -0.22156091034412384, -0.21079786121845245, -0.20003479719161987, -0.1892717331647873, -0.1785086691379547, -0.16774562001228333, -0.15698255598545074, -0.14621950685977936, -0.13545644283294678, -0.1246933862566948, -0.11393032968044281, -0.10316726565361023, -0.09240420907735825, -0.08164115250110626, -0.07087808847427368, -0.0601150318980217, -0.049351971596479416, -0.038588911294937134, -0.02782585471868515, -0.017062794417142868, -0.006299734115600586, 0.004463322460651398, 0.015226386487483978, 0.025989443063735962, 0.036752503365278244, 0.047515563666820526, 0.05827862024307251, 0.06904168426990509, 0.07980474084615707, 0.09056779742240906, 0.10133086144924164, 0.11209391802549362, 0.1228569746017456, 0.13362003862857819, 0.14438310265541077, 0.15514615178108215, 0.16590921580791473, 0.17667227983474731, 0.1874353289604187, 0.19819839298725128, 0.20896145701408386, 0.21972450613975525, 0.23048757016658783, 0.2412506341934204, 0.2520136833190918, 0.2627767324447632, 0.27353981137275696, 0.28430286049842834, 0.29506590962409973, 0.3058289885520935, 0.3165920376777649, 0.3273550868034363, 0.33811816573143005, 0.34888121485710144, 0.3596442937850952, 0.3704073429107666]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 8.0, 8.0, 18.0, 22.0, 29.0, 39.0, 49.0, 90.0, 131.0, 185.0, 288.0, 422.0, 747.0, 1145.0, 1834.0, 3222.0, 5519.0, 10593.0, 19899.0, 40067.0, 80268.0, 162332.0, 258843.0, 221296.0, 119874.0, 58793.0, 29133.0, 14767.0, 7928.0, 4456.0, 2516.0, 1484.0, 898.0, 567.0, 354.0, 241.0, 163.0, 116.0, 59.0, 37.0, 28.0, 23.0, 18.0, 17.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.171630859375, -0.16586685180664062, -0.16010284423828125, -0.15433883666992188, -0.1485748291015625, -0.14281082153320312, -0.13704681396484375, -0.13128280639648438, -0.125518798828125, -0.11975479125976562, -0.11399078369140625, -0.10822677612304688, -0.1024627685546875, -0.09669876098632812, -0.09093475341796875, -0.08517074584960938, -0.07940673828125, -0.07364273071289062, -0.06787872314453125, -0.062114715576171875, -0.0563507080078125, -0.050586700439453125, -0.04482269287109375, -0.039058685302734375, -0.033294677734375, -0.027530670166015625, -0.02176666259765625, -0.016002655029296875, -0.0102386474609375, -0.004474639892578125, 0.00128936767578125, 0.007053375244140625, 0.0128173828125, 0.018581390380859375, 0.02434539794921875, 0.030109405517578125, 0.0358734130859375, 0.041637420654296875, 0.04740142822265625, 0.053165435791015625, 0.058929443359375, 0.06469345092773438, 0.07045745849609375, 0.07622146606445312, 0.0819854736328125, 0.08774948120117188, 0.09351348876953125, 0.09927749633789062, 0.10504150390625, 0.11080551147460938, 0.11656951904296875, 0.12233352661132812, 0.1280975341796875, 0.13386154174804688, 0.13962554931640625, 0.14538955688476562, 0.151153564453125, 0.15691757202148438, 0.16268157958984375, 0.16844558715820312, 0.1742095947265625, 0.17997360229492188, 0.18573760986328125, 0.19150161743164062, 0.197265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 9.0, 4.0, 15.0, 8.0, 7.0, 18.0, 12.0, 27.0, 21.0, 28.0, 32.0, 41.0, 46.0, 51.0, 33.0, 51.0, 53.0, 51.0, 58.0, 49.0, 50.0, 42.0, 44.0, 34.0, 34.0, 20.0, 25.0, 18.0, 22.0, 24.0, 14.0, 13.0, 5.0, 9.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0985107421875, -0.09549903869628906, -0.09248733520507812, -0.08947563171386719, -0.08646392822265625, -0.08345222473144531, -0.08044052124023438, -0.07742881774902344, -0.0744171142578125, -0.07140541076660156, -0.06839370727539062, -0.06538200378417969, -0.06237030029296875, -0.05935859680175781, -0.056346893310546875, -0.05333518981933594, -0.050323486328125, -0.04731178283691406, -0.044300079345703125, -0.04128837585449219, -0.03827667236328125, -0.03526496887207031, -0.032253265380859375, -0.029241561889648438, -0.0262298583984375, -0.023218154907226562, -0.020206451416015625, -0.017194747924804688, -0.01418304443359375, -0.011171340942382812, -0.008159637451171875, -0.0051479339599609375, -0.00213623046875, 0.0008754730224609375, 0.003887176513671875, 0.0068988800048828125, 0.00991058349609375, 0.012922286987304688, 0.015933990478515625, 0.018945693969726562, 0.0219573974609375, 0.024969100952148438, 0.027980804443359375, 0.030992507934570312, 0.03400421142578125, 0.03701591491699219, 0.040027618408203125, 0.04303932189941406, 0.046051025390625, 0.04906272888183594, 0.052074432373046875, 0.05508613586425781, 0.05809783935546875, 0.06110954284667969, 0.06412124633789062, 0.06713294982910156, 0.0701446533203125, 0.07315635681152344, 0.07616806030273438, 0.07917976379394531, 0.08219146728515625, 0.08520317077636719, 0.08821487426757812, 0.09122657775878906, 0.09423828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 12.0, 12.0, 14.0, 18.0, 36.0, 66.0, 116.0, 175.0, 373.0, 700.0, 1530.0, 5793.0, 49294.0, 798592.0, 175836.0, 11633.0, 2411.0, 912.0, 456.0, 244.0, 122.0, 71.0, 47.0, 27.0, 17.0, 11.0, 12.0, 6.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.552734375, -0.526031494140625, -0.49932861328125, -0.472625732421875, -0.4459228515625, -0.419219970703125, -0.39251708984375, -0.365814208984375, -0.339111328125, -0.312408447265625, -0.28570556640625, -0.259002685546875, -0.2322998046875, -0.205596923828125, -0.17889404296875, -0.152191162109375, -0.12548828125, -0.098785400390625, -0.07208251953125, -0.045379638671875, -0.0186767578125, 0.008026123046875, 0.03472900390625, 0.061431884765625, 0.088134765625, 0.114837646484375, 0.14154052734375, 0.168243408203125, 0.1949462890625, 0.221649169921875, 0.24835205078125, 0.275054931640625, 0.3017578125, 0.328460693359375, 0.35516357421875, 0.381866455078125, 0.4085693359375, 0.435272216796875, 0.46197509765625, 0.488677978515625, 0.515380859375, 0.542083740234375, 0.56878662109375, 0.595489501953125, 0.6221923828125, 0.648895263671875, 0.67559814453125, 0.702301025390625, 0.72900390625, 0.755706787109375, 0.78240966796875, 0.809112548828125, 0.8358154296875, 0.862518310546875, 0.88922119140625, 0.915924072265625, 0.942626953125, 0.969329833984375, 0.99603271484375, 1.022735595703125, 1.0494384765625, 1.076141357421875, 1.10284423828125, 1.129547119140625, 1.15625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 9.0, 9.0, 19.0, 11.0, 15.0, 22.0, 22.0, 29.0, 38.0, 24.0, 23.0, 32.0, 35.0, 43.0, 57.0, 56.0, 48.0, 41.0, 44.0, 22.0, 37.0, 43.0, 42.0, 40.0, 34.0, 22.0, 25.0, 32.0, 19.0, 26.0, 17.0, 7.0, 17.0, 9.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.379669189453125, -0.36529541015625, -0.350921630859375, -0.3365478515625, -0.322174072265625, -0.30780029296875, -0.293426513671875, -0.279052734375, -0.264678955078125, -0.25030517578125, -0.235931396484375, -0.2215576171875, -0.207183837890625, -0.19281005859375, -0.178436279296875, -0.1640625, -0.149688720703125, -0.13531494140625, -0.120941162109375, -0.1065673828125, -0.092193603515625, -0.07781982421875, -0.063446044921875, -0.049072265625, -0.034698486328125, -0.02032470703125, -0.005950927734375, 0.0084228515625, 0.022796630859375, 0.03717041015625, 0.051544189453125, 0.06591796875, 0.080291748046875, 0.09466552734375, 0.109039306640625, 0.1234130859375, 0.137786865234375, 0.15216064453125, 0.166534423828125, 0.180908203125, 0.195281982421875, 0.20965576171875, 0.224029541015625, 0.2384033203125, 0.252777099609375, 0.26715087890625, 0.281524658203125, 0.2958984375, 0.310272216796875, 0.32464599609375, 0.339019775390625, 0.3533935546875, 0.367767333984375, 0.38214111328125, 0.396514892578125, 0.410888671875, 0.425262451171875, 0.43963623046875, 0.454010009765625, 0.4683837890625, 0.482757568359375, 0.49713134765625, 0.511505126953125, 0.52587890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 13.0, 19.0, 32.0, 42.0, 73.0, 126.0, 190.0, 354.0, 857.0, 2157.0, 7496.0, 47215.0, 598421.0, 354192.0, 28581.0, 5531.0, 1785.0, 663.0, 341.0, 177.0, 103.0, 56.0, 46.0, 24.0, 8.0, 7.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.25331878662109375, -0.2417449951171875, -0.23017120361328125, -0.218597412109375, -0.20702362060546875, -0.1954498291015625, -0.18387603759765625, -0.17230224609375, -0.16072845458984375, -0.1491546630859375, -0.13758087158203125, -0.126007080078125, -0.11443328857421875, -0.1028594970703125, -0.09128570556640625, -0.0797119140625, -0.06813812255859375, -0.0565643310546875, -0.04499053955078125, -0.033416748046875, -0.02184295654296875, -0.0102691650390625, 0.00130462646484375, 0.01287841796875, 0.02445220947265625, 0.0360260009765625, 0.04759979248046875, 0.059173583984375, 0.07074737548828125, 0.0823211669921875, 0.09389495849609375, 0.10546875, 0.11704254150390625, 0.1286163330078125, 0.14019012451171875, 0.151763916015625, 0.16333770751953125, 0.1749114990234375, 0.18648529052734375, 0.19805908203125, 0.20963287353515625, 0.2212066650390625, 0.23278045654296875, 0.244354248046875, 0.25592803955078125, 0.2675018310546875, 0.27907562255859375, 0.2906494140625, 0.30222320556640625, 0.3137969970703125, 0.32537078857421875, 0.336944580078125, 0.34851837158203125, 0.3600921630859375, 0.37166595458984375, 0.38323974609375, 0.39481353759765625, 0.4063873291015625, 0.41796112060546875, 0.429534912109375, 0.44110870361328125, 0.4526824951171875, 0.46425628662109375, 0.475830078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 4.0, 10.0, 14.0, 18.0, 22.0, 21.0, 33.0, 43.0, 46.0, 48.0, 66.0, 82.0, 89.0, 91.0, 60.0, 70.0, 60.0, 40.0, 38.0, 19.0, 31.0, 16.0, 16.0, 13.0, 14.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.79304313659668e-05, -9.486079216003418e-05, -9.179115295410156e-05, -8.872151374816895e-05, -8.565187454223633e-05, -8.258223533630371e-05, -7.95125961303711e-05, -7.644295692443848e-05, -7.337331771850586e-05, -7.030367851257324e-05, -6.723403930664062e-05, -6.416440010070801e-05, -6.109476089477539e-05, -5.8025121688842773e-05, -5.4955482482910156e-05, -5.188584327697754e-05, -4.881620407104492e-05, -4.5746564865112305e-05, -4.267692565917969e-05, -3.960728645324707e-05, -3.653764724731445e-05, -3.3468008041381836e-05, -3.039836883544922e-05, -2.73287296295166e-05, -2.4259090423583984e-05, -2.1189451217651367e-05, -1.811981201171875e-05, -1.5050172805786133e-05, -1.1980533599853516e-05, -8.910894393920898e-06, -5.841255187988281e-06, -2.771615982055664e-06, 2.980232238769531e-07, 3.3676624298095703e-06, 6.4373016357421875e-06, 9.506940841674805e-06, 1.2576580047607422e-05, 1.564621925354004e-05, 1.8715858459472656e-05, 2.1785497665405273e-05, 2.485513687133789e-05, 2.7924776077270508e-05, 3.0994415283203125e-05, 3.406405448913574e-05, 3.713369369506836e-05, 4.0203332901000977e-05, 4.3272972106933594e-05, 4.634261131286621e-05, 4.941225051879883e-05, 5.2481889724731445e-05, 5.555152893066406e-05, 5.862116813659668e-05, 6.16908073425293e-05, 6.476044654846191e-05, 6.783008575439453e-05, 7.089972496032715e-05, 7.396936416625977e-05, 7.703900337219238e-05, 8.0108642578125e-05, 8.317828178405762e-05, 8.624792098999023e-05, 8.931756019592285e-05, 9.238719940185547e-05, 9.545683860778809e-05, 9.85264778137207e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 4.0, 8.0, 8.0, 13.0, 9.0, 32.0, 22.0, 60.0, 93.0, 123.0, 207.0, 315.0, 559.0, 1062.0, 2216.0, 5828.0, 23379.0, 155656.0, 636744.0, 184233.0, 26743.0, 6576.0, 2254.0, 1041.0, 548.0, 296.0, 170.0, 114.0, 80.0, 44.0, 33.0, 22.0, 19.0, 13.0, 7.0, 5.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.267333984375, -0.25885772705078125, -0.2503814697265625, -0.24190521240234375, -0.233428955078125, -0.22495269775390625, -0.2164764404296875, -0.20800018310546875, -0.19952392578125, -0.19104766845703125, -0.1825714111328125, -0.17409515380859375, -0.165618896484375, -0.15714263916015625, -0.1486663818359375, -0.14019012451171875, -0.1317138671875, -0.12323760986328125, -0.1147613525390625, -0.10628509521484375, -0.097808837890625, -0.08933258056640625, -0.0808563232421875, -0.07238006591796875, -0.06390380859375, -0.05542755126953125, -0.0469512939453125, -0.03847503662109375, -0.029998779296875, -0.02152252197265625, -0.0130462646484375, -0.00457000732421875, 0.00390625, 0.01238250732421875, 0.0208587646484375, 0.02933502197265625, 0.037811279296875, 0.04628753662109375, 0.0547637939453125, 0.06324005126953125, 0.07171630859375, 0.08019256591796875, 0.0886688232421875, 0.09714508056640625, 0.105621337890625, 0.11409759521484375, 0.1225738525390625, 0.13105010986328125, 0.1395263671875, 0.14800262451171875, 0.1564788818359375, 0.16495513916015625, 0.173431396484375, 0.18190765380859375, 0.1903839111328125, 0.19886016845703125, 0.20733642578125, 0.21581268310546875, 0.2242889404296875, 0.23276519775390625, 0.241241455078125, 0.24971771240234375, 0.2581939697265625, 0.26667022705078125, 0.275146484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 9.0, 19.0, 12.0, 10.0, 21.0, 26.0, 30.0, 33.0, 54.0, 62.0, 73.0, 73.0, 89.0, 83.0, 73.0, 67.0, 62.0, 46.0, 44.0, 25.0, 23.0, 15.0, 16.0, 10.0, 13.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18017578125, -0.17345809936523438, -0.16674041748046875, -0.16002273559570312, -0.1533050537109375, -0.14658737182617188, -0.13986968994140625, -0.13315200805664062, -0.126434326171875, -0.11971664428710938, -0.11299896240234375, -0.10628128051757812, -0.0995635986328125, -0.09284591674804688, -0.08612823486328125, -0.07941055297851562, -0.07269287109375, -0.06597518920898438, -0.05925750732421875, -0.052539825439453125, -0.0458221435546875, -0.039104461669921875, -0.03238677978515625, -0.025669097900390625, -0.018951416015625, -0.012233734130859375, -0.00551605224609375, 0.001201629638671875, 0.0079193115234375, 0.014636993408203125, 0.02135467529296875, 0.028072357177734375, 0.0347900390625, 0.041507720947265625, 0.04822540283203125, 0.054943084716796875, 0.0616607666015625, 0.06837844848632812, 0.07509613037109375, 0.08181381225585938, 0.088531494140625, 0.09524917602539062, 0.10196685791015625, 0.10868453979492188, 0.1154022216796875, 0.12211990356445312, 0.12883758544921875, 0.13555526733398438, 0.14227294921875, 0.14899063110351562, 0.15570831298828125, 0.16242599487304688, 0.1691436767578125, 0.17586135864257812, 0.18257904052734375, 0.18929672241210938, 0.196014404296875, 0.20273208618164062, 0.20944976806640625, 0.21616744995117188, 0.2228851318359375, 0.22960281372070312, 0.23632049560546875, 0.24303817749023438, 0.249755859375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 16.0, 23.0, 42.0, 78.0, 114.0, 178.0, 176.0, 149.0, 106.0, 58.0, 28.0, 17.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5629000663757324, -3.409046173095703, -3.255192279815674, -3.1013383865356445, -2.9474844932556152, -2.793630599975586, -2.6397764682769775, -2.4859225749969482, -2.332068681716919, -2.1782147884368896, -2.0243608951568604, -1.8705068826675415, -1.7166529893875122, -1.562799096107483, -1.408945083618164, -1.2550911903381348, -1.1012372970581055, -0.9473834037780762, -0.7935294508934021, -0.639675498008728, -0.48582160472869873, -0.33196771144866943, -0.17811375856399536, -0.02425980567932129, 0.129594087600708, 0.2834480106830597, 0.4373019337654114, 0.5911558866500854, 0.7450097799301147, 0.898863673210144, 1.052717685699463, 1.2065715789794922, 1.3604249954223633, 1.5142788887023926, 1.6681327819824219, 1.8219867944717407, 1.97584068775177, 2.1296944618225098, 2.283548593521118, 2.4374024868011475, 2.5912563800811768, 2.745110273361206, 2.8989641666412354, 3.0528180599212646, 3.206672191619873, 3.3605260848999023, 3.5143799781799316, 3.668233871459961, 3.8220877647399902, 3.9759416580200195, 4.129795551300049, 4.283649444580078, 4.437503337860107, 4.591357231140137, 4.745211124420166, 4.899065017700195, 5.052919387817383, 5.206773281097412, 5.360627174377441, 5.514481067657471, 5.6683349609375, 5.822188854217529, 5.976042747497559, 6.129897117614746, 6.283750534057617]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 11.0, 12.0, 12.0, 9.0, 15.0, 20.0, 19.0, 28.0, 29.0, 39.0, 48.0, 46.0, 51.0, 61.0, 64.0, 59.0, 55.0, 47.0, 39.0, 39.0, 41.0, 28.0, 37.0, 30.0, 32.0, 19.0, 31.0, 9.0, 9.0, 10.0, 9.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6403796672821045, -2.564349412918091, -2.488319158554077, -2.4122889041900635, -2.3362584114074707, -2.260228157043457, -2.1841979026794434, -2.1081676483154297, -2.032137393951416, -1.9561071395874023, -1.8800768852233887, -1.8040465116500854, -1.7280162572860718, -1.651986002922058, -1.5759556293487549, -1.4999253749847412, -1.4238951206207275, -1.3478648662567139, -1.2718346118927002, -1.195804238319397, -1.1197739839553833, -1.0437437295913696, -0.9677134156227112, -0.8916831016540527, -0.8156528472900391, -0.7396225929260254, -0.6635922789573669, -0.5875619649887085, -0.5115317106246948, -0.43550142645835876, -0.3594711422920227, -0.28344082832336426, -0.20741057395935059, -0.13138028979301453, -0.05535000562667847, 0.020680278539657593, 0.09671056270599365, 0.1727408468723297, 0.24877113103866577, 0.3248014450073242, 0.4008316993713379, 0.47686198353767395, 0.55289226770401, 0.6289225816726685, 0.7049528360366821, 0.7809830904006958, 0.8570134043693542, 0.9330437183380127, 1.0090739727020264, 1.08510422706604, 1.1611344814300537, 1.237164855003357, 1.3131951093673706, 1.3892253637313843, 1.4652557373046875, 1.5412859916687012, 1.6173162460327148, 1.6933465003967285, 1.7693767547607422, 1.8454071283340454, 1.921437382698059, 1.9974676370620728, 2.073498010635376, 2.1495282649993896, 2.2255585193634033]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 8.0, 13.0, 15.0, 24.0, 40.0, 53.0, 90.0, 193.0, 329.0, 630.0, 1515.0, 3994.0, 22896.0, 4124936.0, 31536.0, 4775.0, 1661.0, 728.0, 378.0, 154.0, 116.0, 70.0, 41.0, 17.0, 24.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9739837646484375, -0.942108154296875, -0.9102325439453125, -0.87835693359375, -0.8464813232421875, -0.814605712890625, -0.7827301025390625, -0.7508544921875, -0.7189788818359375, -0.687103271484375, -0.6552276611328125, -0.62335205078125, -0.5914764404296875, -0.559600830078125, -0.5277252197265625, -0.495849609375, -0.4639739990234375, -0.432098388671875, -0.4002227783203125, -0.36834716796875, -0.3364715576171875, -0.304595947265625, -0.2727203369140625, -0.2408447265625, -0.2089691162109375, -0.177093505859375, -0.1452178955078125, -0.11334228515625, -0.0814666748046875, -0.049591064453125, -0.0177154541015625, 0.01416015625, 0.0460357666015625, 0.077911376953125, 0.1097869873046875, 0.14166259765625, 0.1735382080078125, 0.205413818359375, 0.2372894287109375, 0.2691650390625, 0.3010406494140625, 0.332916259765625, 0.3647918701171875, 0.39666748046875, 0.4285430908203125, 0.460418701171875, 0.4922943115234375, 0.524169921875, 0.5560455322265625, 0.587921142578125, 0.6197967529296875, 0.65167236328125, 0.6835479736328125, 0.715423583984375, 0.7472991943359375, 0.7791748046875, 0.8110504150390625, 0.842926025390625, 0.8748016357421875, 0.90667724609375, 0.9385528564453125, 0.970428466796875, 1.0023040771484375, 1.0341796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 8.0, 6.0, 11.0, 10.0, 20.0, 23.0, 21.0, 31.0, 38.0, 40.0, 39.0, 49.0, 63.0, 54.0, 69.0, 59.0, 61.0, 53.0, 44.0, 48.0, 49.0, 40.0, 34.0, 35.0, 23.0, 19.0, 16.0, 10.0, 13.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11761474609375, -0.11374378204345703, -0.10987281799316406, -0.1060018539428711, -0.10213088989257812, -0.09825992584228516, -0.09438896179199219, -0.09051799774169922, -0.08664703369140625, -0.08277606964111328, -0.07890510559082031, -0.07503414154052734, -0.07116317749023438, -0.0672922134399414, -0.06342124938964844, -0.05955028533935547, -0.0556793212890625, -0.05180835723876953, -0.04793739318847656, -0.044066429138183594, -0.040195465087890625, -0.036324501037597656, -0.03245353698730469, -0.02858257293701172, -0.02471160888671875, -0.02084064483642578, -0.016969680786132812, -0.013098716735839844, -0.009227752685546875, -0.005356788635253906, -0.0014858245849609375, 0.0023851394653320312, 0.006256103515625, 0.010127067565917969, 0.013998031616210938, 0.017868995666503906, 0.021739959716796875, 0.025610923767089844, 0.029481887817382812, 0.03335285186767578, 0.03722381591796875, 0.04109477996826172, 0.04496574401855469, 0.048836708068847656, 0.052707672119140625, 0.056578636169433594, 0.06044960021972656, 0.06432056427001953, 0.0681915283203125, 0.07206249237060547, 0.07593345642089844, 0.0798044204711914, 0.08367538452148438, 0.08754634857177734, 0.09141731262207031, 0.09528827667236328, 0.09915924072265625, 0.10303020477294922, 0.10690116882324219, 0.11077213287353516, 0.11464309692382812, 0.1185140609741211, 0.12238502502441406, 0.12625598907470703, 0.130126953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 8.0, 11.0, 36.0, 47.0, 74.0, 107.0, 149.0, 216.0, 385.0, 614.0, 1230.0, 2559.0, 7045.0, 45667.0, 4082654.0, 41526.0, 6691.0, 2400.0, 1191.0, 646.0, 363.0, 233.0, 145.0, 85.0, 71.0, 47.0, 27.0, 17.0, 9.0, 10.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8296737670898438, -0.7994842529296875, -0.7692947387695312, -0.739105224609375, -0.7089157104492188, -0.6787261962890625, -0.6485366821289062, -0.61834716796875, -0.5881576538085938, -0.5579681396484375, -0.5277786254882812, -0.497589111328125, -0.46739959716796875, -0.4372100830078125, -0.40702056884765625, -0.3768310546875, -0.34664154052734375, -0.3164520263671875, -0.28626251220703125, -0.256072998046875, -0.22588348388671875, -0.1956939697265625, -0.16550445556640625, -0.13531494140625, -0.10512542724609375, -0.0749359130859375, -0.04474639892578125, -0.014556884765625, 0.01563262939453125, 0.0458221435546875, 0.07601165771484375, 0.106201171875, 0.13639068603515625, 0.1665802001953125, 0.19676971435546875, 0.226959228515625, 0.25714874267578125, 0.2873382568359375, 0.31752777099609375, 0.34771728515625, 0.37790679931640625, 0.4080963134765625, 0.43828582763671875, 0.468475341796875, 0.49866485595703125, 0.5288543701171875, 0.5590438842773438, 0.5892333984375, 0.6194229125976562, 0.6496124267578125, 0.6798019409179688, 0.709991455078125, 0.7401809692382812, 0.7703704833984375, 0.8005599975585938, 0.83074951171875, 0.8609390258789062, 0.8911285400390625, 0.9213180541992188, 0.951507568359375, 0.9816970825195312, 1.0118865966796875, 1.0420761108398438, 1.072265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 22.0, 21.0, 56.0, 198.0, 3424.0, 190.0, 56.0, 31.0, 21.0, 12.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.1543731689453125, -0.148956298828125, -0.1435394287109375, -0.13812255859375, -0.1327056884765625, -0.127288818359375, -0.1218719482421875, -0.116455078125, -0.1110382080078125, -0.105621337890625, -0.1002044677734375, -0.09478759765625, -0.0893707275390625, -0.083953857421875, -0.0785369873046875, -0.0731201171875, -0.0677032470703125, -0.062286376953125, -0.0568695068359375, -0.05145263671875, -0.0460357666015625, -0.040618896484375, -0.0352020263671875, -0.02978515625, -0.0243682861328125, -0.018951416015625, -0.0135345458984375, -0.00811767578125, -0.0027008056640625, 0.002716064453125, 0.0081329345703125, 0.0135498046875, 0.0189666748046875, 0.024383544921875, 0.0298004150390625, 0.03521728515625, 0.0406341552734375, 0.046051025390625, 0.0514678955078125, 0.056884765625, 0.0623016357421875, 0.067718505859375, 0.0731353759765625, 0.07855224609375, 0.0839691162109375, 0.089385986328125, 0.0948028564453125, 0.1002197265625, 0.1056365966796875, 0.111053466796875, 0.1164703369140625, 0.12188720703125, 0.1273040771484375, 0.132720947265625, 0.1381378173828125, 0.1435546875, 0.1489715576171875, 0.154388427734375, 0.1598052978515625, 0.16522216796875, 0.1706390380859375, 0.176055908203125, 0.1814727783203125, 0.1868896484375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 19.0, 25.0, 28.0, 48.0, 50.0, 55.0, 91.0, 103.0, 66.0, 101.0, 99.0, 67.0, 60.0, 44.0, 34.0, 25.0, 9.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5061824321746826, -0.49159905314445496, -0.4770156741142273, -0.46243229508399963, -0.447848916053772, -0.4332655668258667, -0.41868215799331665, -0.4040988087654114, -0.3895154297351837, -0.37493205070495605, -0.3603486716747284, -0.34576529264450073, -0.33118191361427307, -0.3165985345840454, -0.30201518535614014, -0.2874318063259125, -0.2728484272956848, -0.25826504826545715, -0.2436816692352295, -0.22909829020500183, -0.21451492607593536, -0.1999315470457077, -0.18534816801548004, -0.17076480388641357, -0.15618139505386353, -0.14159801602363586, -0.1270146369934082, -0.11243126541376114, -0.09784789383411407, -0.08326451480388641, -0.06868113577365875, -0.05409776419401169, -0.039514392614364624, -0.02493101730942726, -0.01034764014184475, 0.0042357370257377625, 0.018819112330675125, 0.03340248763561249, 0.04798586666584015, 0.06256923824548721, 0.07715261727571487, 0.09173599630594254, 0.1063193678855896, 0.12090274691581726, 0.13548612594604492, 0.15006950497627258, 0.16465288400650024, 0.1792362481355667, 0.19381962716579437, 0.20840300619602203, 0.2229863852262497, 0.23756974935531616, 0.2521531283855438, 0.2667365074157715, 0.28131988644599915, 0.2959032654762268, 0.31048664450645447, 0.32507002353668213, 0.3396534025669098, 0.35423678159713745, 0.3688201606273651, 0.3834035396575928, 0.39798688888549805, 0.4125702679157257, 0.42715364694595337]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 9.0, 11.0, 5.0, 10.0, 4.0, 22.0, 23.0, 11.0, 26.0, 23.0, 29.0, 24.0, 18.0, 30.0, 31.0, 34.0, 30.0, 35.0, 47.0, 44.0, 53.0, 43.0, 48.0, 33.0, 43.0, 34.0, 37.0, 24.0, 25.0, 24.0, 22.0, 24.0, 13.0, 22.0, 11.0, 21.0, 9.0, 8.0, 6.0, 6.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2699427008628845, -0.26148009300231934, -0.25301751494407654, -0.24455492198467255, -0.23609232902526855, -0.22762973606586456, -0.21916714310646057, -0.21070455014705658, -0.2022419571876526, -0.1937793642282486, -0.1853167712688446, -0.1768541783094406, -0.16839158535003662, -0.15992899239063263, -0.15146639943122864, -0.14300380647182465, -0.13454121351242065, -0.12607862055301666, -0.11761602759361267, -0.10915343463420868, -0.10069084167480469, -0.0922282487154007, -0.0837656557559967, -0.07530306279659271, -0.06684046983718872, -0.05837787687778473, -0.04991528391838074, -0.041452690958976746, -0.032990097999572754, -0.024527505040168762, -0.01606491208076477, -0.007602319121360779, 0.0008602738380432129, 0.009322866797447205, 0.017785459756851196, 0.026248052716255188, 0.03471064567565918, 0.04317323863506317, 0.05163583159446716, 0.060098424553871155, 0.06856101751327515, 0.07702361047267914, 0.08548620343208313, 0.09394879639148712, 0.10241138935089111, 0.1108739823102951, 0.1193365752696991, 0.1277991682291031, 0.13626176118850708, 0.14472435414791107, 0.15318694710731506, 0.16164954006671906, 0.17011213302612305, 0.17857472598552704, 0.18703731894493103, 0.19549991190433502, 0.203962504863739, 0.212425097823143, 0.220887690782547, 0.229350283741951, 0.23781287670135498, 0.24627546966075897, 0.25473806262016296, 0.26320064067840576, 0.27166324853897095]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 9.0, 23.0, 19.0, 46.0, 59.0, 74.0, 103.0, 184.0, 297.0, 498.0, 905.0, 1477.0, 3163.0, 6761.0, 15375.0, 36677.0, 91389.0, 233658.0, 357672.0, 179193.0, 69821.0, 28128.0, 11850.0, 5427.0, 2556.0, 1330.0, 714.0, 378.0, 255.0, 147.0, 107.0, 67.0, 61.0, 32.0, 18.0, 17.0, 14.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.2496337890625, -0.24257278442382812, -0.23551177978515625, -0.22845077514648438, -0.2213897705078125, -0.21432876586914062, -0.20726776123046875, -0.20020675659179688, -0.193145751953125, -0.18608474731445312, -0.17902374267578125, -0.17196273803710938, -0.1649017333984375, -0.15784072875976562, -0.15077972412109375, -0.14371871948242188, -0.13665771484375, -0.12959671020507812, -0.12253570556640625, -0.11547470092773438, -0.1084136962890625, -0.10135269165039062, -0.09429168701171875, -0.08723068237304688, -0.080169677734375, -0.07310867309570312, -0.06604766845703125, -0.058986663818359375, -0.0519256591796875, -0.044864654541015625, -0.03780364990234375, -0.030742645263671875, -0.023681640625, -0.016620635986328125, -0.00955963134765625, -0.002498626708984375, 0.0045623779296875, 0.011623382568359375, 0.01868438720703125, 0.025745391845703125, 0.032806396484375, 0.039867401123046875, 0.04692840576171875, 0.053989410400390625, 0.0610504150390625, 0.06811141967773438, 0.07517242431640625, 0.08223342895507812, 0.08929443359375, 0.09635543823242188, 0.10341644287109375, 0.11047744750976562, 0.1175384521484375, 0.12459945678710938, 0.13166046142578125, 0.13872146606445312, 0.145782470703125, 0.15284347534179688, 0.15990447998046875, 0.16696548461914062, 0.1740264892578125, 0.18108749389648438, 0.18814849853515625, 0.19520950317382812, 0.2022705078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 8.0, 7.0, 6.0, 13.0, 18.0, 20.0, 20.0, 25.0, 27.0, 37.0, 54.0, 48.0, 70.0, 52.0, 58.0, 74.0, 65.0, 58.0, 44.0, 55.0, 49.0, 42.0, 24.0, 27.0, 21.0, 24.0, 18.0, 11.0, 13.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12273025512695312, -0.11826324462890625, -0.11379623413085938, -0.1093292236328125, -0.10486221313476562, -0.10039520263671875, -0.09592819213867188, -0.091461181640625, -0.08699417114257812, -0.08252716064453125, -0.07806015014648438, -0.0735931396484375, -0.06912612915039062, -0.06465911865234375, -0.060192108154296875, -0.05572509765625, -0.051258087158203125, -0.04679107666015625, -0.042324066162109375, -0.0378570556640625, -0.033390045166015625, -0.02892303466796875, -0.024456024169921875, -0.019989013671875, -0.015522003173828125, -0.01105499267578125, -0.006587982177734375, -0.0021209716796875, 0.002346038818359375, 0.00681304931640625, 0.011280059814453125, 0.0157470703125, 0.020214080810546875, 0.02468109130859375, 0.029148101806640625, 0.0336151123046875, 0.038082122802734375, 0.04254913330078125, 0.047016143798828125, 0.051483154296875, 0.055950164794921875, 0.06041717529296875, 0.06488418579101562, 0.0693511962890625, 0.07381820678710938, 0.07828521728515625, 0.08275222778320312, 0.08721923828125, 0.09168624877929688, 0.09615325927734375, 0.10062026977539062, 0.1050872802734375, 0.10955429077148438, 0.11402130126953125, 0.11848831176757812, 0.122955322265625, 0.12742233276367188, 0.13188934326171875, 0.13635635375976562, 0.1408233642578125, 0.14529037475585938, 0.14975738525390625, 0.15422439575195312, 0.15869140625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 3.0, 7.0, 8.0, 12.0, 26.0, 23.0, 52.0, 66.0, 80.0, 103.0, 177.0, 285.0, 409.0, 666.0, 1449.0, 3992.0, 20164.0, 257502.0, 704712.0, 47629.0, 6756.0, 1944.0, 938.0, 489.0, 364.0, 224.0, 137.0, 90.0, 66.0, 45.0, 41.0, 20.0, 16.0, 12.0, 12.0, 11.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556640625, -0.537261962890625, -0.51885986328125, -0.500457763671875, -0.4820556640625, -0.463653564453125, -0.44525146484375, -0.426849365234375, -0.408447265625, -0.390045166015625, -0.37164306640625, -0.353240966796875, -0.3348388671875, -0.316436767578125, -0.29803466796875, -0.279632568359375, -0.26123046875, -0.242828369140625, -0.22442626953125, -0.206024169921875, -0.1876220703125, -0.169219970703125, -0.15081787109375, -0.132415771484375, -0.114013671875, -0.095611572265625, -0.07720947265625, -0.058807373046875, -0.0404052734375, -0.022003173828125, -0.00360107421875, 0.014801025390625, 0.033203125, 0.051605224609375, 0.07000732421875, 0.088409423828125, 0.1068115234375, 0.125213623046875, 0.14361572265625, 0.162017822265625, 0.180419921875, 0.198822021484375, 0.21722412109375, 0.235626220703125, 0.2540283203125, 0.272430419921875, 0.29083251953125, 0.309234619140625, 0.32763671875, 0.346038818359375, 0.36444091796875, 0.382843017578125, 0.4012451171875, 0.419647216796875, 0.43804931640625, 0.456451416015625, 0.474853515625, 0.493255615234375, 0.51165771484375, 0.530059814453125, 0.5484619140625, 0.566864013671875, 0.58526611328125, 0.603668212890625, 0.6220703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 5.0, 18.0, 22.0, 24.0, 20.0, 19.0, 21.0, 20.0, 29.0, 39.0, 31.0, 45.0, 49.0, 50.0, 39.0, 47.0, 39.0, 35.0, 36.0, 42.0, 38.0, 41.0, 29.0, 26.0, 28.0, 28.0, 23.0, 24.0, 18.0, 24.0, 10.0, 9.0, 14.0, 4.0, 8.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.467041015625, -0.4519615173339844, -0.43688201904296875, -0.4218025207519531, -0.4067230224609375, -0.3916435241699219, -0.37656402587890625, -0.3614845275878906, -0.346405029296875, -0.3313255310058594, -0.31624603271484375, -0.3011665344238281, -0.2860870361328125, -0.2710075378417969, -0.25592803955078125, -0.24084854125976562, -0.22576904296875, -0.21068954467773438, -0.19561004638671875, -0.18053054809570312, -0.1654510498046875, -0.15037155151367188, -0.13529205322265625, -0.12021255493164062, -0.105133056640625, -0.09005355834960938, -0.07497406005859375, -0.059894561767578125, -0.0448150634765625, -0.029735565185546875, -0.01465606689453125, 0.000423431396484375, 0.0155029296875, 0.030582427978515625, 0.04566192626953125, 0.060741424560546875, 0.0758209228515625, 0.09090042114257812, 0.10597991943359375, 0.12105941772460938, 0.136138916015625, 0.15121841430664062, 0.16629791259765625, 0.18137741088867188, 0.1964569091796875, 0.21153640747070312, 0.22661590576171875, 0.24169540405273438, 0.25677490234375, 0.2718544006347656, 0.28693389892578125, 0.3020133972167969, 0.3170928955078125, 0.3321723937988281, 0.34725189208984375, 0.3623313903808594, 0.377410888671875, 0.3924903869628906, 0.40756988525390625, 0.4226493835449219, 0.4377288818359375, 0.4528083801269531, 0.46788787841796875, 0.4829673767089844, 0.498046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 7.0, 10.0, 18.0, 25.0, 33.0, 55.0, 85.0, 139.0, 261.0, 586.0, 1374.0, 4905.0, 33725.0, 599703.0, 378347.0, 23289.0, 3742.0, 1169.0, 491.0, 239.0, 138.0, 70.0, 45.0, 22.0, 24.0, 14.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.336181640625, -0.3256492614746094, -0.31511688232421875, -0.3045845031738281, -0.2940521240234375, -0.2835197448730469, -0.27298736572265625, -0.2624549865722656, -0.251922607421875, -0.24139022827148438, -0.23085784912109375, -0.22032546997070312, -0.2097930908203125, -0.19926071166992188, -0.18872833251953125, -0.17819595336914062, -0.16766357421875, -0.15713119506835938, -0.14659881591796875, -0.13606643676757812, -0.1255340576171875, -0.11500167846679688, -0.10446929931640625, -0.09393692016601562, -0.083404541015625, -0.07287216186523438, -0.06233978271484375, -0.051807403564453125, -0.0412750244140625, -0.030742645263671875, -0.02021026611328125, -0.009677886962890625, 0.0008544921875, 0.011386871337890625, 0.02191925048828125, 0.032451629638671875, 0.0429840087890625, 0.053516387939453125, 0.06404876708984375, 0.07458114624023438, 0.085113525390625, 0.09564590454101562, 0.10617828369140625, 0.11671066284179688, 0.1272430419921875, 0.13777542114257812, 0.14830780029296875, 0.15884017944335938, 0.16937255859375, 0.17990493774414062, 0.19043731689453125, 0.20096969604492188, 0.2115020751953125, 0.22203445434570312, 0.23256683349609375, 0.24309921264648438, 0.253631591796875, 0.2641639709472656, 0.27469635009765625, 0.2852287292480469, 0.2957611083984375, 0.3062934875488281, 0.31682586669921875, 0.3273582458496094, 0.337890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 7.0, 2.0, 9.0, 9.0, 13.0, 17.0, 19.0, 22.0, 26.0, 43.0, 62.0, 87.0, 109.0, 119.0, 98.0, 75.0, 47.0, 47.0, 24.0, 33.0, 27.0, 32.0, 22.0, 9.0, 9.0, 7.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.07046890258789e-05, -7.765740156173706e-05, -7.461011409759521e-05, -7.156282663345337e-05, -6.851553916931152e-05, -6.546825170516968e-05, -6.242096424102783e-05, -5.9373676776885986e-05, -5.632638931274414e-05, -5.3279101848602295e-05, -5.023181438446045e-05, -4.7184526920318604e-05, -4.413723945617676e-05, -4.108995199203491e-05, -3.8042664527893066e-05, -3.499537706375122e-05, -3.1948089599609375e-05, -2.890080213546753e-05, -2.5853514671325684e-05, -2.2806227207183838e-05, -1.9758939743041992e-05, -1.6711652278900146e-05, -1.36643648147583e-05, -1.0617077350616455e-05, -7.569789886474609e-06, -4.522502422332764e-06, -1.475214958190918e-06, 1.5720725059509277e-06, 4.6193599700927734e-06, 7.666647434234619e-06, 1.0713934898376465e-05, 1.376122236251831e-05, 1.6808509826660156e-05, 1.9855797290802002e-05, 2.2903084754943848e-05, 2.5950372219085693e-05, 2.899765968322754e-05, 3.2044947147369385e-05, 3.509223461151123e-05, 3.8139522075653076e-05, 4.118680953979492e-05, 4.423409700393677e-05, 4.728138446807861e-05, 5.032867193222046e-05, 5.3375959396362305e-05, 5.642324686050415e-05, 5.9470534324645996e-05, 6.251782178878784e-05, 6.556510925292969e-05, 6.861239671707153e-05, 7.165968418121338e-05, 7.470697164535522e-05, 7.775425910949707e-05, 8.080154657363892e-05, 8.384883403778076e-05, 8.689612150192261e-05, 8.994340896606445e-05, 9.29906964302063e-05, 9.603798389434814e-05, 9.908527135848999e-05, 0.00010213255882263184, 0.00010517984628677368, 0.00010822713375091553, 0.00011127442121505737, 0.00011432170867919922]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 6.0, 5.0, 4.0, 17.0, 29.0, 45.0, 72.0, 137.0, 257.0, 529.0, 1142.0, 3095.0, 14799.0, 181382.0, 766566.0, 68621.0, 8003.0, 2154.0, 827.0, 397.0, 191.0, 97.0, 68.0, 39.0, 22.0, 8.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.445068359375, -0.4340324401855469, -0.42299652099609375, -0.4119606018066406, -0.4009246826171875, -0.3898887634277344, -0.37885284423828125, -0.3678169250488281, -0.356781005859375, -0.3457450866699219, -0.33470916748046875, -0.3236732482910156, -0.3126373291015625, -0.3016014099121094, -0.29056549072265625, -0.2795295715332031, -0.26849365234375, -0.2574577331542969, -0.24642181396484375, -0.23538589477539062, -0.2243499755859375, -0.21331405639648438, -0.20227813720703125, -0.19124221801757812, -0.180206298828125, -0.16917037963867188, -0.15813446044921875, -0.14709854125976562, -0.1360626220703125, -0.12502670288085938, -0.11399078369140625, -0.10295486450195312, -0.0919189453125, -0.08088302612304688, -0.06984710693359375, -0.058811187744140625, -0.0477752685546875, -0.036739349365234375, -0.02570343017578125, -0.014667510986328125, -0.003631591796875, 0.007404327392578125, 0.01844024658203125, 0.029476165771484375, 0.0405120849609375, 0.051548004150390625, 0.06258392333984375, 0.07361984252929688, 0.08465576171875, 0.09569168090820312, 0.10672760009765625, 0.11776351928710938, 0.1287994384765625, 0.13983535766601562, 0.15087127685546875, 0.16190719604492188, 0.172943115234375, 0.18397903442382812, 0.19501495361328125, 0.20605087280273438, 0.2170867919921875, 0.22812271118164062, 0.23915863037109375, 0.2501945495605469, 0.26123046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 7.0, 8.0, 15.0, 12.0, 29.0, 26.0, 21.0, 46.0, 45.0, 54.0, 56.0, 82.0, 94.0, 91.0, 79.0, 65.0, 51.0, 46.0, 32.0, 25.0, 21.0, 26.0, 20.0, 7.0, 10.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2149658203125, -0.20880889892578125, -0.2026519775390625, -0.19649505615234375, -0.190338134765625, -0.18418121337890625, -0.1780242919921875, -0.17186737060546875, -0.16571044921875, -0.15955352783203125, -0.1533966064453125, -0.14723968505859375, -0.141082763671875, -0.13492584228515625, -0.1287689208984375, -0.12261199951171875, -0.116455078125, -0.11029815673828125, -0.1041412353515625, -0.09798431396484375, -0.091827392578125, -0.08567047119140625, -0.0795135498046875, -0.07335662841796875, -0.06719970703125, -0.06104278564453125, -0.0548858642578125, -0.04872894287109375, -0.042572021484375, -0.03641510009765625, -0.0302581787109375, -0.02410125732421875, -0.0179443359375, -0.01178741455078125, -0.0056304931640625, 0.00052642822265625, 0.006683349609375, 0.01284027099609375, 0.0189971923828125, 0.02515411376953125, 0.03131103515625, 0.03746795654296875, 0.0436248779296875, 0.04978179931640625, 0.055938720703125, 0.06209564208984375, 0.0682525634765625, 0.07440948486328125, 0.08056640625, 0.08672332763671875, 0.0928802490234375, 0.09903717041015625, 0.105194091796875, 0.11135101318359375, 0.1175079345703125, 0.12366485595703125, 0.12982177734375, 0.13597869873046875, 0.1421356201171875, 0.14829254150390625, 0.154449462890625, 0.16060638427734375, 0.1667633056640625, 0.17292022705078125, 0.1790771484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 10.0, 44.0, 87.0, 139.0, 194.0, 203.0, 142.0, 82.0, 53.0, 23.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.191871643066406, -5.030223369598389, -4.868575096130371, -4.706927299499512, -4.545279026031494, -4.383630752563477, -4.221982955932617, -4.0603346824646, -3.898686408996582, -3.7370381355285645, -3.575390100479126, -3.4137420654296875, -3.25209379196167, -3.0904455184936523, -2.928797483444214, -2.7671494483947754, -2.605501174926758, -2.4438529014587402, -2.2822048664093018, -2.1205568313598633, -1.9589085578918457, -1.7972604036331177, -1.6356122493743896, -1.4739640951156616, -1.3123159408569336, -1.1506677865982056, -0.9890196323394775, -0.8273714780807495, -0.6657233238220215, -0.5040751695632935, -0.34242701530456543, -0.1807788610458374, -0.019130229949951172, 0.14251792430877686, 0.3041660785675049, 0.4658142328262329, 0.6274623870849609, 0.789110541343689, 0.950758695602417, 1.112406849861145, 1.274055004119873, 1.435703158378601, 1.597351312637329, 1.7589994668960571, 1.9206476211547852, 2.0822958946228027, 2.243943929672241, 2.4055919647216797, 2.5672402381896973, 2.728888511657715, 2.8905365467071533, 3.052184581756592, 3.2138328552246094, 3.375481128692627, 3.5371291637420654, 3.698777198791504, 3.8604254722595215, 4.022073745727539, 4.183721542358398, 4.345369815826416, 4.507018089294434, 4.668666362762451, 4.830314636230469, 4.991962432861328, 5.153610706329346]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 7.0, 9.0, 13.0, 20.0, 27.0, 28.0, 29.0, 58.0, 42.0, 50.0, 57.0, 47.0, 63.0, 50.0, 54.0, 66.0, 56.0, 57.0, 28.0, 37.0, 24.0, 23.0, 32.0, 28.0, 15.0, 13.0, 12.0, 10.0, 9.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.012929677963257, -2.918456554412842, -2.8239834308624268, -2.7295103073120117, -2.6350371837615967, -2.5405640602111816, -2.4460911750793457, -2.3516178131103516, -2.2571449279785156, -2.1626718044281006, -2.0681986808776855, -1.9737255573272705, -1.8792524337768555, -1.7847793102264404, -1.690306305885315, -1.5958331823349, -1.5013599395751953, -1.4068868160247803, -1.3124136924743652, -1.2179405689239502, -1.1234674453735352, -1.0289943218231201, -0.9345213174819946, -0.8400481939315796, -0.7455750703811646, -0.6511019468307495, -0.5566288232803345, -0.4621557593345642, -0.36768263578414917, -0.27320951223373413, -0.17873644828796387, -0.08426332473754883, 0.01020956039428711, 0.10468266904354095, 0.1991557776927948, 0.29362887144088745, 0.3881019949913025, 0.48257511854171753, 0.5770481824874878, 0.6715213060379028, 0.7659944295883179, 0.8604675531387329, 0.954940676689148, 1.0494136810302734, 1.1438868045806885, 1.2383599281311035, 1.3328330516815186, 1.4273061752319336, 1.5217792987823486, 1.6162524223327637, 1.7107255458831787, 1.8051986694335938, 1.8996717929840088, 1.9941449165344238, 2.0886178016662598, 2.183091163635254, 2.27756404876709, 2.372037172317505, 2.46651029586792, 2.560983419418335, 2.65545654296875, 2.749929666519165, 2.84440279006958, 2.938875675201416, 3.03334903717041]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 14.0, 11.0, 14.0, 23.0, 34.0, 39.0, 48.0, 75.0, 137.0, 176.0, 276.0, 446.0, 684.0, 1165.0, 2321.0, 4740.0, 13963.0, 69278.0, 3898357.0, 166350.0, 22636.0, 6737.0, 2852.0, 1553.0, 823.0, 510.0, 322.0, 236.0, 142.0, 109.0, 65.0, 48.0, 27.0, 15.0, 13.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47412109375, -0.4586639404296875, -0.443206787109375, -0.4277496337890625, -0.41229248046875, -0.3968353271484375, -0.381378173828125, -0.3659210205078125, -0.3504638671875, -0.3350067138671875, -0.319549560546875, -0.3040924072265625, -0.28863525390625, -0.2731781005859375, -0.257720947265625, -0.2422637939453125, -0.226806640625, -0.2113494873046875, -0.195892333984375, -0.1804351806640625, -0.16497802734375, -0.1495208740234375, -0.134063720703125, -0.1186065673828125, -0.1031494140625, -0.0876922607421875, -0.072235107421875, -0.0567779541015625, -0.04132080078125, -0.0258636474609375, -0.010406494140625, 0.0050506591796875, 0.0205078125, 0.0359649658203125, 0.051422119140625, 0.0668792724609375, 0.08233642578125, 0.0977935791015625, 0.113250732421875, 0.1287078857421875, 0.1441650390625, 0.1596221923828125, 0.175079345703125, 0.1905364990234375, 0.20599365234375, 0.2214508056640625, 0.236907958984375, 0.2523651123046875, 0.267822265625, 0.2832794189453125, 0.298736572265625, 0.3141937255859375, 0.32965087890625, 0.3451080322265625, 0.360565185546875, 0.3760223388671875, 0.3914794921875, 0.4069366455078125, 0.422393798828125, 0.4378509521484375, 0.45330810546875, 0.4687652587890625, 0.484222412109375, 0.4996795654296875, 0.51513671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 8.0, 17.0, 16.0, 18.0, 23.0, 23.0, 33.0, 38.0, 48.0, 48.0, 50.0, 71.0, 66.0, 67.0, 53.0, 66.0, 60.0, 54.0, 34.0, 39.0, 32.0, 29.0, 13.0, 22.0, 13.0, 11.0, 5.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15478515625, -0.15075111389160156, -0.14671707153320312, -0.1426830291748047, -0.13864898681640625, -0.1346149444580078, -0.13058090209960938, -0.12654685974121094, -0.1225128173828125, -0.11847877502441406, -0.11444473266601562, -0.11041069030761719, -0.10637664794921875, -0.10234260559082031, -0.09830856323242188, -0.09427452087402344, -0.090240478515625, -0.08620643615722656, -0.08217239379882812, -0.07813835144042969, -0.07410430908203125, -0.07007026672363281, -0.06603622436523438, -0.06200218200683594, -0.0579681396484375, -0.05393409729003906, -0.049900054931640625, -0.04586601257324219, -0.04183197021484375, -0.03779792785644531, -0.033763885498046875, -0.029729843139648438, -0.02569580078125, -0.021661758422851562, -0.017627716064453125, -0.013593673706054688, -0.00955963134765625, -0.0055255889892578125, -0.001491546630859375, 0.0025424957275390625, 0.0065765380859375, 0.010610580444335938, 0.014644622802734375, 0.018678665161132812, 0.02271270751953125, 0.026746749877929688, 0.030780792236328125, 0.03481483459472656, 0.038848876953125, 0.04288291931152344, 0.046916961669921875, 0.05095100402832031, 0.05498504638671875, 0.05901908874511719, 0.06305313110351562, 0.06708717346191406, 0.0711212158203125, 0.07515525817871094, 0.07918930053710938, 0.08322334289550781, 0.08725738525390625, 0.09129142761230469, 0.09532546997070312, 0.09935951232910156, 0.1033935546875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 8.0, 6.0, 12.0, 11.0, 13.0, 20.0, 22.0, 33.0, 48.0, 69.0, 87.0, 120.0, 199.0, 361.0, 725.0, 1519.0, 4455.0, 21148.0, 3307784.0, 831421.0, 18939.0, 4131.0, 1432.0, 665.0, 388.0, 205.0, 118.0, 84.0, 62.0, 47.0, 37.0, 26.0, 18.0, 18.0, 10.0, 7.0, 2.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0595703125, -1.0301132202148438, -1.0006561279296875, -0.9711990356445312, -0.941741943359375, -0.9122848510742188, -0.8828277587890625, -0.8533706665039062, -0.82391357421875, -0.7944564819335938, -0.7649993896484375, -0.7355422973632812, -0.706085205078125, -0.6766281127929688, -0.6471710205078125, -0.6177139282226562, -0.5882568359375, -0.5587997436523438, -0.5293426513671875, -0.49988555908203125, -0.470428466796875, -0.44097137451171875, -0.4115142822265625, -0.38205718994140625, -0.35260009765625, -0.32314300537109375, -0.2936859130859375, -0.26422882080078125, -0.234771728515625, -0.20531463623046875, -0.1758575439453125, -0.14640045166015625, -0.116943359375, -0.08748626708984375, -0.0580291748046875, -0.02857208251953125, 0.000885009765625, 0.03034210205078125, 0.0597991943359375, 0.08925628662109375, 0.11871337890625, 0.14817047119140625, 0.1776275634765625, 0.20708465576171875, 0.236541748046875, 0.26599884033203125, 0.2954559326171875, 0.32491302490234375, 0.3543701171875, 0.38382720947265625, 0.4132843017578125, 0.44274139404296875, 0.472198486328125, 0.5016555786132812, 0.5311126708984375, 0.5605697631835938, 0.59002685546875, 0.6194839477539062, 0.6489410400390625, 0.6783981323242188, 0.707855224609375, 0.7373123168945312, 0.7667694091796875, 0.7962265014648438, 0.82568359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 12.0, 9.0, 13.0, 36.0, 87.0, 536.0, 3076.0, 183.0, 53.0, 27.0, 23.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6062431335449219, -0.5918807983398438, -0.5775184631347656, -0.5631561279296875, -0.5487937927246094, -0.5344314575195312, -0.5200691223144531, -0.505706787109375, -0.4913444519042969, -0.47698211669921875, -0.4626197814941406, -0.4482574462890625, -0.4338951110839844, -0.41953277587890625, -0.4051704406738281, -0.39080810546875, -0.3764457702636719, -0.36208343505859375, -0.3477210998535156, -0.3333587646484375, -0.3189964294433594, -0.30463409423828125, -0.2902717590332031, -0.275909423828125, -0.2615470886230469, -0.24718475341796875, -0.23282241821289062, -0.2184600830078125, -0.20409774780273438, -0.18973541259765625, -0.17537307739257812, -0.1610107421875, -0.14664840698242188, -0.13228607177734375, -0.11792373657226562, -0.1035614013671875, -0.08919906616210938, -0.07483673095703125, -0.060474395751953125, -0.046112060546875, -0.031749725341796875, -0.01738739013671875, -0.003025054931640625, 0.0113372802734375, 0.025699615478515625, 0.04006195068359375, 0.054424285888671875, 0.06878662109375, 0.08314895629882812, 0.09751129150390625, 0.11187362670898438, 0.1262359619140625, 0.14059829711914062, 0.15496063232421875, 0.16932296752929688, 0.183685302734375, 0.19804763793945312, 0.21240997314453125, 0.22677230834960938, 0.2411346435546875, 0.2554969787597656, 0.26985931396484375, 0.2842216491699219, 0.298583984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 11.0, 29.0, 42.0, 50.0, 66.0, 82.0, 69.0, 106.0, 102.0, 107.0, 71.0, 58.0, 61.0, 42.0, 27.0, 14.0, 13.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9232059717178345, -0.8934664726257324, -0.8637269139289856, -0.8339874148368835, -0.8042478561401367, -0.7745083570480347, -0.7447688579559326, -0.7150293588638306, -0.6852898001670837, -0.6555503010749817, -0.6258107423782349, -0.5960712432861328, -0.5663317441940308, -0.5365921854972839, -0.5068526864051819, -0.47711315751075745, -0.447373628616333, -0.41763409972190857, -0.38789457082748413, -0.3581550717353821, -0.32841554284095764, -0.2986760139465332, -0.26893651485443115, -0.2391969859600067, -0.20945745706558228, -0.17971792817115784, -0.1499784141778946, -0.12023889273405075, -0.09049937129020691, -0.06075984239578247, -0.031020328402519226, -0.0012808144092559814, 0.02845865488052368, 0.05819817632436752, 0.08793769776821136, 0.1176772192120552, 0.14741674065589905, 0.1771562695503235, 0.20689578354358673, 0.23663529753684998, 0.2663748264312744, 0.29611435532569885, 0.3258538842201233, 0.35559338331222534, 0.3853329122066498, 0.4150724411010742, 0.44481194019317627, 0.4745514690876007, 0.5042909979820251, 0.5340304970741272, 0.563770055770874, 0.5935095548629761, 0.6232490539550781, 0.652988612651825, 0.682728111743927, 0.7124676704406738, 0.7422071695327759, 0.7719466686248779, 0.8016862273216248, 0.8314257264137268, 0.8611652851104736, 0.8909047842025757, 0.9206442832946777, 0.9503837823867798, 0.9801233410835266]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 12.0, 10.0, 8.0, 13.0, 7.0, 23.0, 28.0, 26.0, 26.0, 25.0, 33.0, 37.0, 36.0, 51.0, 40.0, 38.0, 52.0, 55.0, 40.0, 47.0, 42.0, 49.0, 37.0, 31.0, 37.0, 33.0, 24.0, 29.0, 13.0, 20.0, 14.0, 11.0, 13.0, 9.0, 8.0, 4.0, 1.0, 5.0, 1.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7504131197929382, -0.7291819453239441, -0.7079508304595947, -0.6867196559906006, -0.6654884815216064, -0.6442573666572571, -0.6230261921882629, -0.6017950773239136, -0.5805639028549194, -0.5593327283859253, -0.5381016135215759, -0.5168704390525818, -0.49563929438591003, -0.4744081497192383, -0.45317697525024414, -0.4319458305835724, -0.41071468591690063, -0.3894835412502289, -0.36825239658355713, -0.347021222114563, -0.32579007744789124, -0.3045589327812195, -0.28332775831222534, -0.2620966136455536, -0.24086546897888184, -0.21963432431221008, -0.19840316474437714, -0.1771720051765442, -0.15594086050987244, -0.13470971584320068, -0.11347855627536774, -0.09224739670753479, -0.07101625204086304, -0.04978509992361069, -0.028553947806358337, -0.0073227956891059875, 0.013908356428146362, 0.03513950854539871, 0.05637066066265106, 0.07760182023048401, 0.09883296489715576, 0.12006411701440811, 0.14129526913166046, 0.1625264286994934, 0.18375757336616516, 0.20498871803283691, 0.22621987760066986, 0.2474510371685028, 0.26868218183517456, 0.2899133265018463, 0.31114447116851807, 0.3323756456375122, 0.35360679030418396, 0.3748379349708557, 0.39606910943984985, 0.4173002541065216, 0.43853139877319336, 0.4597625434398651, 0.48099368810653687, 0.502224862575531, 0.5234559774398804, 0.5446871519088745, 0.5659183263778687, 0.5871495008468628, 0.6083806157112122]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 16.0, 26.0, 39.0, 71.0, 103.0, 149.0, 269.0, 463.0, 794.0, 1437.0, 2637.0, 4963.0, 9640.0, 20112.0, 42131.0, 89385.0, 209963.0, 362416.0, 163017.0, 72860.0, 34241.0, 16373.0, 8109.0, 4161.0, 2247.0, 1268.0, 687.0, 380.0, 208.0, 143.0, 82.0, 41.0, 39.0, 20.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269775390625, -0.2608909606933594, -0.25200653076171875, -0.24312210083007812, -0.2342376708984375, -0.22535324096679688, -0.21646881103515625, -0.20758438110351562, -0.198699951171875, -0.18981552124023438, -0.18093109130859375, -0.17204666137695312, -0.1631622314453125, -0.15427780151367188, -0.14539337158203125, -0.13650894165039062, -0.12762451171875, -0.11874008178710938, -0.10985565185546875, -0.10097122192382812, -0.0920867919921875, -0.08320236206054688, -0.07431793212890625, -0.06543350219726562, -0.056549072265625, -0.047664642333984375, -0.03878021240234375, -0.029895782470703125, -0.0210113525390625, -0.012126922607421875, -0.00324249267578125, 0.005641937255859375, 0.0145263671875, 0.023410797119140625, 0.03229522705078125, 0.041179656982421875, 0.0500640869140625, 0.058948516845703125, 0.06783294677734375, 0.07671737670898438, 0.085601806640625, 0.09448623657226562, 0.10337066650390625, 0.11225509643554688, 0.1211395263671875, 0.13002395629882812, 0.13890838623046875, 0.14779281616210938, 0.15667724609375, 0.16556167602539062, 0.17444610595703125, 0.18333053588867188, 0.1922149658203125, 0.20109939575195312, 0.20998382568359375, 0.21886825561523438, 0.227752685546875, 0.23663711547851562, 0.24552154541015625, 0.2544059753417969, 0.2632904052734375, 0.2721748352050781, 0.28105926513671875, 0.2899436950683594, 0.298828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 16.0, 17.0, 15.0, 13.0, 35.0, 36.0, 29.0, 46.0, 49.0, 62.0, 57.0, 58.0, 49.0, 66.0, 54.0, 62.0, 48.0, 42.0, 44.0, 38.0, 29.0, 28.0, 18.0, 24.0, 10.0, 6.0, 10.0, 8.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.16436004638671875, -0.1596527099609375, -0.15494537353515625, -0.150238037109375, -0.14553070068359375, -0.1408233642578125, -0.13611602783203125, -0.13140869140625, -0.12670135498046875, -0.1219940185546875, -0.11728668212890625, -0.112579345703125, -0.10787200927734375, -0.1031646728515625, -0.09845733642578125, -0.09375, -0.08904266357421875, -0.0843353271484375, -0.07962799072265625, -0.074920654296875, -0.07021331787109375, -0.0655059814453125, -0.06079864501953125, -0.05609130859375, -0.05138397216796875, -0.0466766357421875, -0.04196929931640625, -0.037261962890625, -0.03255462646484375, -0.0278472900390625, -0.02313995361328125, -0.0184326171875, -0.01372528076171875, -0.0090179443359375, -0.00431060791015625, 0.000396728515625, 0.00510406494140625, 0.0098114013671875, 0.01451873779296875, 0.01922607421875, 0.02393341064453125, 0.0286407470703125, 0.03334808349609375, 0.038055419921875, 0.04276275634765625, 0.0474700927734375, 0.05217742919921875, 0.056884765625, 0.06159210205078125, 0.0662994384765625, 0.07100677490234375, 0.075714111328125, 0.08042144775390625, 0.0851287841796875, 0.08983612060546875, 0.09454345703125, 0.09925079345703125, 0.1039581298828125, 0.10866546630859375, 0.113372802734375, 0.11808013916015625, 0.1227874755859375, 0.12749481201171875, 0.1322021484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 5.0, 8.0, 13.0, 12.0, 27.0, 41.0, 52.0, 75.0, 171.0, 252.0, 371.0, 576.0, 1171.0, 2708.0, 9987.0, 82112.0, 796453.0, 134588.0, 13570.0, 3244.0, 1323.0, 672.0, 434.0, 234.0, 145.0, 100.0, 54.0, 43.0, 30.0, 23.0, 13.0, 7.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8949737548828125, -0.870513916015625, -0.8460540771484375, -0.82159423828125, -0.7971343994140625, -0.772674560546875, -0.7482147216796875, -0.7237548828125, -0.6992950439453125, -0.674835205078125, -0.6503753662109375, -0.62591552734375, -0.6014556884765625, -0.576995849609375, -0.5525360107421875, -0.528076171875, -0.5036163330078125, -0.479156494140625, -0.4546966552734375, -0.43023681640625, -0.4057769775390625, -0.381317138671875, -0.3568572998046875, -0.3323974609375, -0.3079376220703125, -0.283477783203125, -0.2590179443359375, -0.23455810546875, -0.2100982666015625, -0.185638427734375, -0.1611785888671875, -0.13671875, -0.1122589111328125, -0.087799072265625, -0.0633392333984375, -0.03887939453125, -0.0144195556640625, 0.010040283203125, 0.0345001220703125, 0.0589599609375, 0.0834197998046875, 0.107879638671875, 0.1323394775390625, 0.15679931640625, 0.1812591552734375, 0.205718994140625, 0.2301788330078125, 0.254638671875, 0.2790985107421875, 0.303558349609375, 0.3280181884765625, 0.35247802734375, 0.3769378662109375, 0.401397705078125, 0.4258575439453125, 0.4503173828125, 0.4747772216796875, 0.499237060546875, 0.5236968994140625, 0.54815673828125, 0.5726165771484375, 0.597076416015625, 0.6215362548828125, 0.64599609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 10.0, 7.0, 12.0, 8.0, 8.0, 20.0, 17.0, 7.0, 22.0, 18.0, 21.0, 31.0, 35.0, 27.0, 45.0, 38.0, 49.0, 47.0, 48.0, 64.0, 43.0, 46.0, 37.0, 33.0, 41.0, 35.0, 31.0, 30.0, 36.0, 28.0, 26.0, 16.0, 9.0, 12.0, 9.0, 11.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5634765625, -0.5464248657226562, -0.5293731689453125, -0.5123214721679688, -0.495269775390625, -0.47821807861328125, -0.4611663818359375, -0.44411468505859375, -0.42706298828125, -0.41001129150390625, -0.3929595947265625, -0.37590789794921875, -0.358856201171875, -0.34180450439453125, -0.3247528076171875, -0.30770111083984375, -0.2906494140625, -0.27359771728515625, -0.2565460205078125, -0.23949432373046875, -0.222442626953125, -0.20539093017578125, -0.1883392333984375, -0.17128753662109375, -0.15423583984375, -0.13718414306640625, -0.1201324462890625, -0.10308074951171875, -0.086029052734375, -0.06897735595703125, -0.0519256591796875, -0.03487396240234375, -0.017822265625, -0.00077056884765625, 0.0162811279296875, 0.03333282470703125, 0.050384521484375, 0.06743621826171875, 0.0844879150390625, 0.10153961181640625, 0.11859130859375, 0.13564300537109375, 0.1526947021484375, 0.16974639892578125, 0.186798095703125, 0.20384979248046875, 0.2209014892578125, 0.23795318603515625, 0.2550048828125, 0.27205657958984375, 0.2891082763671875, 0.30615997314453125, 0.323211669921875, 0.34026336669921875, 0.3573150634765625, 0.37436676025390625, 0.39141845703125, 0.40847015380859375, 0.4255218505859375, 0.44257354736328125, 0.459625244140625, 0.47667694091796875, 0.4937286376953125, 0.5107803344726562, 0.52783203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 7.0, 6.0, 16.0, 22.0, 21.0, 27.0, 50.0, 97.0, 144.0, 269.0, 519.0, 1214.0, 2992.0, 8965.0, 39874.0, 407808.0, 523224.0, 47595.0, 9973.0, 3194.0, 1271.0, 558.0, 297.0, 171.0, 82.0, 49.0, 36.0, 21.0, 14.0, 13.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30078125, -0.29219818115234375, -0.2836151123046875, -0.27503204345703125, -0.266448974609375, -0.25786590576171875, -0.2492828369140625, -0.24069976806640625, -0.23211669921875, -0.22353363037109375, -0.2149505615234375, -0.20636749267578125, -0.197784423828125, -0.18920135498046875, -0.1806182861328125, -0.17203521728515625, -0.1634521484375, -0.15486907958984375, -0.1462860107421875, -0.13770294189453125, -0.129119873046875, -0.12053680419921875, -0.1119537353515625, -0.10337066650390625, -0.09478759765625, -0.08620452880859375, -0.0776214599609375, -0.06903839111328125, -0.060455322265625, -0.05187225341796875, -0.0432891845703125, -0.03470611572265625, -0.026123046875, -0.01753997802734375, -0.0089569091796875, -0.00037384033203125, 0.008209228515625, 0.01679229736328125, 0.0253753662109375, 0.03395843505859375, 0.04254150390625, 0.05112457275390625, 0.0597076416015625, 0.06829071044921875, 0.076873779296875, 0.08545684814453125, 0.0940399169921875, 0.10262298583984375, 0.1112060546875, 0.11978912353515625, 0.1283721923828125, 0.13695526123046875, 0.145538330078125, 0.15412139892578125, 0.1627044677734375, 0.17128753662109375, 0.17987060546875, 0.18845367431640625, 0.1970367431640625, 0.20561981201171875, 0.214202880859375, 0.22278594970703125, 0.2313690185546875, 0.23995208740234375, 0.24853515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 11.0, 6.0, 10.0, 15.0, 20.0, 29.0, 32.0, 42.0, 68.0, 83.0, 95.0, 139.0, 128.0, 77.0, 50.0, 46.0, 30.0, 36.0, 22.0, 14.0, 19.0, 15.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00015687942504882812, -0.00015281885862350464, -0.00014875829219818115, -0.00014469772577285767, -0.00014063715934753418, -0.0001365765929222107, -0.0001325160264968872, -0.00012845546007156372, -0.00012439489364624023, -0.00012033432722091675, -0.00011627376079559326, -0.00011221319437026978, -0.00010815262794494629, -0.0001040920615196228, -0.00010003149509429932, -9.597092866897583e-05, -9.191036224365234e-05, -8.784979581832886e-05, -8.378922939300537e-05, -7.972866296768188e-05, -7.56680965423584e-05, -7.160753011703491e-05, -6.754696369171143e-05, -6.348639726638794e-05, -5.942583084106445e-05, -5.536526441574097e-05, -5.130469799041748e-05, -4.7244131565093994e-05, -4.318356513977051e-05, -3.912299871444702e-05, -3.5062432289123535e-05, -3.100186586380005e-05, -2.6941299438476562e-05, -2.2880733013153076e-05, -1.882016658782959e-05, -1.4759600162506104e-05, -1.0699033737182617e-05, -6.638467311859131e-06, -2.5779008865356445e-06, 1.4826655387878418e-06, 5.543231964111328e-06, 9.603798389434814e-06, 1.36643648147583e-05, 1.7724931240081787e-05, 2.1785497665405273e-05, 2.584606409072876e-05, 2.9906630516052246e-05, 3.396719694137573e-05, 3.802776336669922e-05, 4.2088329792022705e-05, 4.614889621734619e-05, 5.020946264266968e-05, 5.4270029067993164e-05, 5.833059549331665e-05, 6.239116191864014e-05, 6.645172834396362e-05, 7.051229476928711e-05, 7.45728611946106e-05, 7.863342761993408e-05, 8.269399404525757e-05, 8.675456047058105e-05, 9.081512689590454e-05, 9.487569332122803e-05, 9.893625974655151e-05, 0.000102996826171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 5.0, 13.0, 16.0, 17.0, 29.0, 35.0, 64.0, 85.0, 138.0, 228.0, 460.0, 871.0, 1882.0, 4776.0, 17520.0, 116173.0, 721552.0, 153939.0, 21004.0, 5489.0, 2147.0, 858.0, 512.0, 262.0, 156.0, 112.0, 63.0, 33.0, 27.0, 21.0, 15.0, 8.0, 11.0, 9.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.24276351928710938, -0.23455047607421875, -0.22633743286132812, -0.2181243896484375, -0.20991134643554688, -0.20169830322265625, -0.19348526000976562, -0.185272216796875, -0.17705917358398438, -0.16884613037109375, -0.16063308715820312, -0.1524200439453125, -0.14420700073242188, -0.13599395751953125, -0.12778091430664062, -0.11956787109375, -0.11135482788085938, -0.10314178466796875, -0.09492874145507812, -0.0867156982421875, -0.07850265502929688, -0.07028961181640625, -0.062076568603515625, -0.053863525390625, -0.045650482177734375, -0.03743743896484375, -0.029224395751953125, -0.0210113525390625, -0.012798309326171875, -0.00458526611328125, 0.003627777099609375, 0.0118408203125, 0.020053863525390625, 0.02826690673828125, 0.036479949951171875, 0.0446929931640625, 0.052906036376953125, 0.06111907958984375, 0.06933212280273438, 0.077545166015625, 0.08575820922851562, 0.09397125244140625, 0.10218429565429688, 0.1103973388671875, 0.11861038208007812, 0.12682342529296875, 0.13503646850585938, 0.14324951171875, 0.15146255493164062, 0.15967559814453125, 0.16788864135742188, 0.1761016845703125, 0.18431472778320312, 0.19252777099609375, 0.20074081420898438, 0.208953857421875, 0.21716690063476562, 0.22537994384765625, 0.23359298706054688, 0.2418060302734375, 0.2500190734863281, 0.25823211669921875, 0.2664451599121094, 0.274658203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 4.0, 5.0, 9.0, 6.0, 14.0, 10.0, 18.0, 33.0, 31.0, 33.0, 61.0, 56.0, 80.0, 88.0, 70.0, 68.0, 80.0, 46.0, 59.0, 48.0, 31.0, 20.0, 19.0, 24.0, 12.0, 7.0, 7.0, 11.0, 8.0, 3.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.205322265625, -0.1996936798095703, -0.19406509399414062, -0.18843650817871094, -0.18280792236328125, -0.17717933654785156, -0.17155075073242188, -0.1659221649169922, -0.1602935791015625, -0.1546649932861328, -0.14903640747070312, -0.14340782165527344, -0.13777923583984375, -0.13215065002441406, -0.12652206420898438, -0.12089347839355469, -0.115264892578125, -0.10963630676269531, -0.10400772094726562, -0.09837913513183594, -0.09275054931640625, -0.08712196350097656, -0.08149337768554688, -0.07586479187011719, -0.0702362060546875, -0.06460762023925781, -0.058979034423828125, -0.05335044860839844, -0.04772186279296875, -0.04209327697753906, -0.036464691162109375, -0.030836105346679688, -0.02520751953125, -0.019578933715820312, -0.013950347900390625, -0.008321762084960938, -0.00269317626953125, 0.0029354095458984375, 0.008563995361328125, 0.014192581176757812, 0.0198211669921875, 0.025449752807617188, 0.031078338623046875, 0.03670692443847656, 0.04233551025390625, 0.04796409606933594, 0.053592681884765625, 0.05922126770019531, 0.064849853515625, 0.07047843933105469, 0.07610702514648438, 0.08173561096191406, 0.08736419677734375, 0.09299278259277344, 0.09862136840820312, 0.10424995422363281, 0.1098785400390625, 0.11550712585449219, 0.12113571166992188, 0.12676429748535156, 0.13239288330078125, 0.13802146911621094, 0.14365005493164062, 0.1492786407470703, 0.1549072265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 10.0, 11.0, 22.0, 47.0, 72.0, 103.0, 138.0, 175.0, 151.0, 119.0, 68.0, 35.0, 19.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.929521083831787, -4.779421806335449, -4.629322052001953, -4.479222774505615, -4.329123497009277, -4.1790242195129395, -4.028924942016602, -3.8788251876831055, -3.7287259101867676, -3.5786266326904297, -3.4285271167755127, -3.2784276008605957, -3.128328323364258, -2.97822904586792, -2.828129529953003, -2.678030014038086, -2.527930736541748, -2.37783145904541, -2.227731943130493, -2.077632427215576, -1.9275331497192383, -1.7774337530136108, -1.6273343563079834, -1.477234959602356, -1.3271355628967285, -1.177036166191101, -1.0269367694854736, -0.8768373727798462, -0.7267379760742188, -0.5766385793685913, -0.42653918266296387, -0.2764397859573364, -0.12634038925170898, 0.023759007453918457, 0.1738584041595459, 0.32395780086517334, 0.4740571975708008, 0.6241565942764282, 0.7742559909820557, 0.9243553876876831, 1.0744547843933105, 1.224554181098938, 1.3746535778045654, 1.5247529745101929, 1.6748523712158203, 1.8249517679214478, 1.9750511646270752, 2.125150680541992, 2.27524995803833, 2.425349235534668, 2.575448751449585, 2.725548267364502, 2.87564754486084, 3.0257468223571777, 3.1758463382720947, 3.3259458541870117, 3.4760451316833496, 3.6261444091796875, 3.7762439250946045, 3.9263434410095215, 4.076442718505859, 4.226541996002197, 4.376641273498535, 4.526741027832031, 4.676840305328369]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 12.0, 11.0, 17.0, 20.0, 21.0, 25.0, 30.0, 25.0, 42.0, 37.0, 48.0, 51.0, 38.0, 68.0, 61.0, 60.0, 60.0, 48.0, 72.0, 33.0, 43.0, 18.0, 26.0, 26.0, 13.0, 18.0, 14.0, 8.0, 10.0, 9.0, 6.0, 4.0, 5.0, 4.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75789737701416, -2.66742205619812, -2.576946973800659, -2.486471652984619, -2.395996570587158, -2.305521249771118, -2.215045928955078, -2.124570846557617, -2.0340957641601562, -1.9436205625534058, -1.8531453609466553, -1.7626700401306152, -1.6721949577331543, -1.5817196369171143, -1.4912444353103638, -1.4007692337036133, -1.3102939128875732, -1.2198187112808228, -1.1293435096740723, -1.0388681888580322, -0.9483930468559265, -0.857917845249176, -0.7674425840377808, -0.6769673824310303, -0.5864921808242798, -0.4960169792175293, -0.4055417478084564, -0.31506651639938354, -0.22459131479263306, -0.13411611318588257, -0.043640851974487305, 0.046834349632263184, 0.13730931282043457, 0.22778452932834625, 0.31825974583625793, 0.4087349772453308, 0.4992101788520813, 0.5896853804588318, 0.680160641670227, 0.7706358432769775, 0.861111044883728, 0.9515862464904785, 1.042061448097229, 1.1325366497039795, 1.2230119705200195, 1.3134870529174805, 1.4039623737335205, 1.494437575340271, 1.5849127769470215, 1.675387978553772, 1.7658631801605225, 1.8563385009765625, 1.9468135833740234, 2.0372889041900635, 2.1277642250061035, 2.2182393074035645, 2.3087143898010254, 2.3991897106170654, 2.4896647930145264, 2.5801401138305664, 2.6706151962280273, 2.7610905170440674, 2.8515658378601074, 2.9420409202575684, 3.0325162410736084]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 4.0, 7.0, 5.0, 5.0, 20.0, 17.0, 14.0, 30.0, 46.0, 53.0, 76.0, 107.0, 148.0, 155.0, 248.0, 387.0, 546.0, 809.0, 1247.0, 2185.0, 3647.0, 6778.0, 14012.0, 32301.0, 95929.0, 534029.0, 2824231.0, 520138.0, 95482.0, 31880.0, 13690.0, 6572.0, 3648.0, 2086.0, 1231.0, 763.0, 527.0, 354.0, 221.0, 206.0, 129.0, 96.0, 58.0, 45.0, 30.0, 26.0, 23.0, 13.0, 13.0, 12.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.226806640625, -0.2191162109375, -0.21142578125, -0.2037353515625, -0.196044921875, -0.1883544921875, -0.1806640625, -0.1729736328125, -0.165283203125, -0.1575927734375, -0.14990234375, -0.1422119140625, -0.134521484375, -0.1268310546875, -0.119140625, -0.1114501953125, -0.103759765625, -0.0960693359375, -0.08837890625, -0.0806884765625, -0.072998046875, -0.0653076171875, -0.0576171875, -0.0499267578125, -0.042236328125, -0.0345458984375, -0.02685546875, -0.0191650390625, -0.011474609375, -0.0037841796875, 0.00390625, 0.0115966796875, 0.019287109375, 0.0269775390625, 0.03466796875, 0.0423583984375, 0.050048828125, 0.0577392578125, 0.0654296875, 0.0731201171875, 0.080810546875, 0.0885009765625, 0.09619140625, 0.1038818359375, 0.111572265625, 0.1192626953125, 0.126953125, 0.1346435546875, 0.142333984375, 0.1500244140625, 0.15771484375, 0.1654052734375, 0.173095703125, 0.1807861328125, 0.1884765625, 0.1961669921875, 0.203857421875, 0.2115478515625, 0.21923828125, 0.2269287109375, 0.234619140625, 0.2423095703125, 0.25, 0.2576904296875, 0.265380859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 5.0, 12.0, 8.0, 18.0, 30.0, 33.0, 28.0, 32.0, 44.0, 34.0, 49.0, 54.0, 56.0, 62.0, 53.0, 48.0, 51.0, 52.0, 44.0, 43.0, 38.0, 36.0, 31.0, 24.0, 23.0, 16.0, 9.0, 16.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.142333984375, -0.1383228302001953, -0.13431167602539062, -0.13030052185058594, -0.12628936767578125, -0.12227821350097656, -0.11826705932617188, -0.11425590515136719, -0.1102447509765625, -0.10623359680175781, -0.10222244262695312, -0.09821128845214844, -0.09420013427734375, -0.09018898010253906, -0.08617782592773438, -0.08216667175292969, -0.078155517578125, -0.07414436340332031, -0.07013320922851562, -0.06612205505371094, -0.06211090087890625, -0.05809974670410156, -0.054088592529296875, -0.05007743835449219, -0.0460662841796875, -0.04205513000488281, -0.038043975830078125, -0.03403282165527344, -0.03002166748046875, -0.026010513305664062, -0.021999359130859375, -0.017988204956054688, -0.01397705078125, -0.009965896606445312, -0.005954742431640625, -0.0019435882568359375, 0.00206756591796875, 0.0060787200927734375, 0.010089874267578125, 0.014101028442382812, 0.0181121826171875, 0.022123336791992188, 0.026134490966796875, 0.030145645141601562, 0.03415679931640625, 0.03816795349121094, 0.042179107666015625, 0.04619026184082031, 0.050201416015625, 0.05421257019042969, 0.058223724365234375, 0.06223487854003906, 0.06624603271484375, 0.07025718688964844, 0.07426834106445312, 0.07827949523925781, 0.0822906494140625, 0.08630180358886719, 0.09031295776367188, 0.09432411193847656, 0.09833526611328125, 0.10234642028808594, 0.10635757446289062, 0.11036872863769531, 0.1143798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 9.0, 27.0, 27.0, 34.0, 34.0, 63.0, 92.0, 168.0, 230.0, 366.0, 604.0, 1161.0, 2121.0, 4817.0, 11066.0, 29044.0, 94476.0, 525657.0, 2965880.0, 428322.0, 83647.0, 26990.0, 10327.0, 4388.0, 2092.0, 1071.0, 570.0, 346.0, 216.0, 136.0, 72.0, 59.0, 52.0, 25.0, 19.0, 13.0, 12.0, 10.0, 5.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.321533203125, -0.3116264343261719, -0.30171966552734375, -0.2918128967285156, -0.2819061279296875, -0.2719993591308594, -0.26209259033203125, -0.2521858215332031, -0.242279052734375, -0.23237228393554688, -0.22246551513671875, -0.21255874633789062, -0.2026519775390625, -0.19274520874023438, -0.18283843994140625, -0.17293167114257812, -0.16302490234375, -0.15311813354492188, -0.14321136474609375, -0.13330459594726562, -0.1233978271484375, -0.11349105834960938, -0.10358428955078125, -0.09367752075195312, -0.083770751953125, -0.07386398315429688, -0.06395721435546875, -0.054050445556640625, -0.0441436767578125, -0.034236907958984375, -0.02433013916015625, -0.014423370361328125, -0.0045166015625, 0.005390167236328125, 0.01529693603515625, 0.025203704833984375, 0.0351104736328125, 0.045017242431640625, 0.05492401123046875, 0.06483078002929688, 0.074737548828125, 0.08464431762695312, 0.09455108642578125, 0.10445785522460938, 0.1143646240234375, 0.12427139282226562, 0.13417816162109375, 0.14408493041992188, 0.15399169921875, 0.16389846801757812, 0.17380523681640625, 0.18371200561523438, 0.1936187744140625, 0.20352554321289062, 0.21343231201171875, 0.22333908081054688, 0.233245849609375, 0.24315261840820312, 0.25305938720703125, 0.2629661560058594, 0.2728729248046875, 0.2827796936035156, 0.29268646240234375, 0.3025932312011719, 0.3125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 9.0, 7.0, 17.0, 13.0, 24.0, 28.0, 34.0, 58.0, 76.0, 132.0, 213.0, 375.0, 699.0, 907.0, 618.0, 307.0, 167.0, 119.0, 79.0, 59.0, 28.0, 30.0, 19.0, 15.0, 12.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.51171875, -0.4972572326660156, -0.48279571533203125, -0.4683341979980469, -0.4538726806640625, -0.4394111633300781, -0.42494964599609375, -0.4104881286621094, -0.396026611328125, -0.3815650939941406, -0.36710357666015625, -0.3526420593261719, -0.3381805419921875, -0.3237190246582031, -0.30925750732421875, -0.2947959899902344, -0.28033447265625, -0.2658729553222656, -0.25141143798828125, -0.23694992065429688, -0.2224884033203125, -0.20802688598632812, -0.19356536865234375, -0.17910385131835938, -0.164642333984375, -0.15018081665039062, -0.13571929931640625, -0.12125778198242188, -0.1067962646484375, -0.09233474731445312, -0.07787322998046875, -0.06341171264648438, -0.0489501953125, -0.034488677978515625, -0.02002716064453125, -0.005565643310546875, 0.0088958740234375, 0.023357391357421875, 0.03781890869140625, 0.052280426025390625, 0.066741943359375, 0.08120346069335938, 0.09566497802734375, 0.11012649536132812, 0.1245880126953125, 0.13904953002929688, 0.15351104736328125, 0.16797256469726562, 0.18243408203125, 0.19689559936523438, 0.21135711669921875, 0.22581863403320312, 0.2402801513671875, 0.2547416687011719, 0.26920318603515625, 0.2836647033691406, 0.298126220703125, 0.3125877380371094, 0.32704925537109375, 0.3415107727050781, 0.3559722900390625, 0.3704338073730469, 0.38489532470703125, 0.3993568420410156, 0.413818359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 11.0, 19.0, 41.0, 122.0, 238.0, 248.0, 165.0, 85.0, 29.0, 16.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.198184013366699, -7.004678726196289, -6.811172962188721, -6.617667198181152, -6.424161911010742, -6.230656623840332, -6.037150859832764, -5.843645095825195, -5.650139808654785, -5.456634521484375, -5.263128757476807, -5.069622993469238, -4.876117706298828, -4.682612419128418, -4.48910665512085, -4.295600891113281, -4.102095603942871, -3.908590078353882, -3.7150845527648926, -3.5215790271759033, -3.328073501586914, -3.134567975997925, -2.9410624504089355, -2.7475569248199463, -2.554051399230957, -2.3605458736419678, -2.1670403480529785, -1.9735348224639893, -1.780029296875, -1.5865237712860107, -1.3930182456970215, -1.1995127201080322, -1.0060076713562012, -0.8125021457672119, -0.6189966201782227, -0.4254910945892334, -0.23198556900024414, -0.03848004341125488, 0.15502548217773438, 0.34853100776672363, 0.5420365333557129, 0.7355420589447021, 0.9290475845336914, 1.1225531101226807, 1.31605863571167, 1.5095641613006592, 1.7030696868896484, 1.8965752124786377, 2.090080738067627, 2.283586263656616, 2.4770917892456055, 2.6705973148345947, 2.864102840423584, 3.0576083660125732, 3.2511138916015625, 3.4446194171905518, 3.638124942779541, 3.8316304683685303, 4.0251359939575195, 4.21864128112793, 4.412147045135498, 4.605652809143066, 4.799158096313477, 4.992663383483887, 5.186169147491455]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 9.0, 11.0, 15.0, 16.0, 17.0, 27.0, 27.0, 36.0, 40.0, 45.0, 38.0, 56.0, 40.0, 43.0, 57.0, 40.0, 48.0, 54.0, 50.0, 38.0, 41.0, 29.0, 35.0, 30.0, 24.0, 17.0, 19.0, 23.0, 11.0, 7.0, 7.0, 9.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.888577938079834, -1.8317358493804932, -1.7748937606811523, -1.718051552772522, -1.6612094640731812, -1.6043673753738403, -1.5475252866744995, -1.4906830787658691, -1.4338409900665283, -1.3769989013671875, -1.3201568126678467, -1.2633146047592163, -1.2064725160598755, -1.1496304273605347, -1.0927883386611938, -1.0359461307525635, -0.9791041016578674, -0.9222620129585266, -0.865419864654541, -0.8085777759552002, -0.7517356276512146, -0.6948935389518738, -0.6380513906478882, -0.5812093019485474, -0.5243672132492065, -0.46752509474754333, -0.4106829762458801, -0.3538408875465393, -0.2969987392425537, -0.2401566505432129, -0.18331453204154968, -0.12647241353988647, -0.06963026523590088, -0.01278815045952797, 0.04405396431684494, 0.10089607536792755, 0.15773819386959076, 0.21458029747009277, 0.271422415971756, 0.3282645344734192, 0.3851066529750824, 0.4419487714767456, 0.4987908899784088, 0.555633008480072, 0.6124750971794128, 0.6693172454833984, 0.7261593341827393, 0.7830014228820801, 0.8398435711860657, 0.8966856598854065, 0.9535278081893921, 1.010369896888733, 1.0672119855880737, 1.124054193496704, 1.180896282196045, 1.2377383708953857, 1.2945804595947266, 1.3514225482940674, 1.4082646369934082, 1.4651068449020386, 1.5219489336013794, 1.5787910223007202, 1.635633111000061, 1.6924753189086914, 1.7493174076080322]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 11.0, 16.0, 25.0, 31.0, 65.0, 79.0, 104.0, 166.0, 252.0, 322.0, 502.0, 680.0, 1065.0, 1560.0, 2341.0, 3631.0, 5820.0, 9614.0, 16510.0, 29259.0, 57849.0, 142997.0, 381026.0, 224686.0, 79522.0, 37781.0, 20618.0, 11784.0, 7177.0, 4502.0, 2831.0, 1795.0, 1184.0, 838.0, 549.0, 412.0, 263.0, 198.0, 127.0, 97.0, 67.0, 58.0, 36.0, 23.0, 30.0, 15.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2406005859375, -0.23276329040527344, -0.22492599487304688, -0.2170886993408203, -0.20925140380859375, -0.2014141082763672, -0.19357681274414062, -0.18573951721191406, -0.1779022216796875, -0.17006492614746094, -0.16222763061523438, -0.1543903350830078, -0.14655303955078125, -0.1387157440185547, -0.13087844848632812, -0.12304115295410156, -0.115203857421875, -0.10736656188964844, -0.09952926635742188, -0.09169197082519531, -0.08385467529296875, -0.07601737976074219, -0.06818008422851562, -0.06034278869628906, -0.0525054931640625, -0.04466819763183594, -0.036830902099609375, -0.028993606567382812, -0.02115631103515625, -0.013319015502929688, -0.005481719970703125, 0.0023555755615234375, 0.01019287109375, 0.018030166625976562, 0.025867462158203125, 0.03370475769042969, 0.04154205322265625, 0.04937934875488281, 0.057216644287109375, 0.06505393981933594, 0.0728912353515625, 0.08072853088378906, 0.08856582641601562, 0.09640312194824219, 0.10424041748046875, 0.11207771301269531, 0.11991500854492188, 0.12775230407714844, 0.135589599609375, 0.14342689514160156, 0.15126419067382812, 0.1591014862060547, 0.16693878173828125, 0.1747760772705078, 0.18261337280273438, 0.19045066833496094, 0.1982879638671875, 0.20612525939941406, 0.21396255493164062, 0.2217998504638672, 0.22963714599609375, 0.2374744415283203, 0.24531173706054688, 0.25314903259277344, 0.260986328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 4.0, 4.0, 16.0, 6.0, 18.0, 10.0, 20.0, 26.0, 22.0, 35.0, 28.0, 44.0, 44.0, 32.0, 40.0, 41.0, 57.0, 51.0, 33.0, 53.0, 41.0, 46.0, 31.0, 37.0, 42.0, 34.0, 24.0, 25.0, 16.0, 17.0, 16.0, 13.0, 13.0, 12.0, 4.0, 12.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11572265625, -0.1121826171875, -0.108642578125, -0.1051025390625, -0.1015625, -0.0980224609375, -0.094482421875, -0.0909423828125, -0.08740234375, -0.0838623046875, -0.080322265625, -0.0767822265625, -0.0732421875, -0.0697021484375, -0.066162109375, -0.0626220703125, -0.05908203125, -0.0555419921875, -0.052001953125, -0.0484619140625, -0.044921875, -0.0413818359375, -0.037841796875, -0.0343017578125, -0.03076171875, -0.0272216796875, -0.023681640625, -0.0201416015625, -0.0166015625, -0.0130615234375, -0.009521484375, -0.0059814453125, -0.00244140625, 0.0010986328125, 0.004638671875, 0.0081787109375, 0.01171875, 0.0152587890625, 0.018798828125, 0.0223388671875, 0.02587890625, 0.0294189453125, 0.032958984375, 0.0364990234375, 0.0400390625, 0.0435791015625, 0.047119140625, 0.0506591796875, 0.05419921875, 0.0577392578125, 0.061279296875, 0.0648193359375, 0.068359375, 0.0718994140625, 0.075439453125, 0.0789794921875, 0.08251953125, 0.0860595703125, 0.089599609375, 0.0931396484375, 0.0966796875, 0.1002197265625, 0.103759765625, 0.1072998046875, 0.11083984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 18.0, 10.0, 14.0, 15.0, 23.0, 29.0, 39.0, 73.0, 87.0, 137.0, 180.0, 298.0, 376.0, 629.0, 1124.0, 2453.0, 6134.0, 22990.0, 155878.0, 767589.0, 68691.0, 13060.0, 4170.0, 1841.0, 978.0, 552.0, 357.0, 234.0, 169.0, 111.0, 75.0, 52.0, 42.0, 29.0, 20.0, 20.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.71875, -0.6989593505859375, -0.679168701171875, -0.6593780517578125, -0.63958740234375, -0.6197967529296875, -0.600006103515625, -0.5802154541015625, -0.5604248046875, -0.5406341552734375, -0.520843505859375, -0.5010528564453125, -0.48126220703125, -0.4614715576171875, -0.441680908203125, -0.4218902587890625, -0.402099609375, -0.3823089599609375, -0.362518310546875, -0.3427276611328125, -0.32293701171875, -0.3031463623046875, -0.283355712890625, -0.2635650634765625, -0.2437744140625, -0.2239837646484375, -0.204193115234375, -0.1844024658203125, -0.16461181640625, -0.1448211669921875, -0.125030517578125, -0.1052398681640625, -0.08544921875, -0.0656585693359375, -0.045867919921875, -0.0260772705078125, -0.00628662109375, 0.0135040283203125, 0.033294677734375, 0.0530853271484375, 0.0728759765625, 0.0926666259765625, 0.112457275390625, 0.1322479248046875, 0.15203857421875, 0.1718292236328125, 0.191619873046875, 0.2114105224609375, 0.231201171875, 0.2509918212890625, 0.270782470703125, 0.2905731201171875, 0.31036376953125, 0.3301544189453125, 0.349945068359375, 0.3697357177734375, 0.3895263671875, 0.4093170166015625, 0.429107666015625, 0.4488983154296875, 0.46868896484375, 0.4884796142578125, 0.508270263671875, 0.5280609130859375, 0.5478515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 4.0, 3.0, 11.0, 7.0, 9.0, 4.0, 19.0, 24.0, 19.0, 16.0, 29.0, 28.0, 49.0, 37.0, 41.0, 43.0, 56.0, 53.0, 54.0, 54.0, 50.0, 49.0, 44.0, 49.0, 30.0, 29.0, 27.0, 27.0, 19.0, 25.0, 15.0, 18.0, 13.0, 10.0, 8.0, 11.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5262527465820312, -0.5085601806640625, -0.49086761474609375, -0.473175048828125, -0.45548248291015625, -0.4377899169921875, -0.42009735107421875, -0.40240478515625, -0.38471221923828125, -0.3670196533203125, -0.34932708740234375, -0.331634521484375, -0.31394195556640625, -0.2962493896484375, -0.27855682373046875, -0.2608642578125, -0.24317169189453125, -0.2254791259765625, -0.20778656005859375, -0.190093994140625, -0.17240142822265625, -0.1547088623046875, -0.13701629638671875, -0.11932373046875, -0.10163116455078125, -0.0839385986328125, -0.06624603271484375, -0.048553466796875, -0.03086090087890625, -0.0131683349609375, 0.00452423095703125, 0.022216796875, 0.03990936279296875, 0.0576019287109375, 0.07529449462890625, 0.092987060546875, 0.11067962646484375, 0.1283721923828125, 0.14606475830078125, 0.16375732421875, 0.18144989013671875, 0.1991424560546875, 0.21683502197265625, 0.234527587890625, 0.25222015380859375, 0.2699127197265625, 0.28760528564453125, 0.3052978515625, 0.32299041748046875, 0.3406829833984375, 0.35837554931640625, 0.376068115234375, 0.39376068115234375, 0.4114532470703125, 0.42914581298828125, 0.44683837890625, 0.46453094482421875, 0.4822235107421875, 0.49991607666015625, 0.517608642578125, 0.5353012084960938, 0.5529937744140625, 0.5706863403320312, 0.58837890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 11.0, 13.0, 12.0, 19.0, 26.0, 41.0, 57.0, 87.0, 177.0, 289.0, 499.0, 1083.0, 2642.0, 7597.0, 29670.0, 195725.0, 710934.0, 75829.0, 15632.0, 4672.0, 1790.0, 777.0, 370.0, 204.0, 130.0, 81.0, 67.0, 36.0, 23.0, 11.0, 18.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.1982555389404297, -0.19009017944335938, -0.18192481994628906, -0.17375946044921875, -0.16559410095214844, -0.15742874145507812, -0.1492633819580078, -0.1410980224609375, -0.1329326629638672, -0.12476730346679688, -0.11660194396972656, -0.10843658447265625, -0.10027122497558594, -0.09210586547851562, -0.08394050598144531, -0.075775146484375, -0.06760978698730469, -0.059444427490234375, -0.05127906799316406, -0.04311370849609375, -0.03494834899902344, -0.026782989501953125, -0.018617630004882812, -0.0104522705078125, -0.0022869110107421875, 0.005878448486328125, 0.014043807983398438, 0.02220916748046875, 0.030374526977539062, 0.038539886474609375, 0.04670524597167969, 0.05487060546875, 0.06303596496582031, 0.07120132446289062, 0.07936668395996094, 0.08753204345703125, 0.09569740295410156, 0.10386276245117188, 0.11202812194824219, 0.1201934814453125, 0.1283588409423828, 0.13652420043945312, 0.14468955993652344, 0.15285491943359375, 0.16102027893066406, 0.16918563842773438, 0.1773509979248047, 0.185516357421875, 0.1936817169189453, 0.20184707641601562, 0.21001243591308594, 0.21817779541015625, 0.22634315490722656, 0.23450851440429688, 0.2426738739013672, 0.2508392333984375, 0.2590045928955078, 0.2671699523925781, 0.27533531188964844, 0.28350067138671875, 0.29166603088378906, 0.2998313903808594, 0.3079967498779297, 0.316162109375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 9.0, 12.0, 24.0, 34.0, 29.0, 58.0, 66.0, 107.0, 141.0, 140.0, 89.0, 74.0, 43.0, 34.0, 24.0, 15.0, 18.0, 16.0, 17.0, 10.0, 2.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014209747314453125, -0.00013854540884494781, -0.00013499334454536438, -0.00013144128024578094, -0.0001278892159461975, -0.00012433715164661407, -0.00012078508734703064, -0.0001172330230474472, -0.00011368095874786377, -0.00011012889444828033, -0.0001065768301486969, -0.00010302476584911346, -9.947270154953003e-05, -9.59206372499466e-05, -9.236857295036316e-05, -8.881650865077972e-05, -8.526444435119629e-05, -8.171238005161285e-05, -7.816031575202942e-05, -7.460825145244598e-05, -7.105618715286255e-05, -6.750412285327911e-05, -6.395205855369568e-05, -6.0399994254112244e-05, -5.684792995452881e-05, -5.3295865654945374e-05, -4.974380135536194e-05, -4.6191737055778503e-05, -4.263967275619507e-05, -3.908760845661163e-05, -3.55355441570282e-05, -3.198347985744476e-05, -2.8431415557861328e-05, -2.4879351258277893e-05, -2.1327286958694458e-05, -1.7775222659111023e-05, -1.4223158359527588e-05, -1.0671094059944153e-05, -7.119029760360718e-06, -3.5669654607772827e-06, -1.4901161193847656e-08, 3.5371631383895874e-06, 7.0892274379730225e-06, 1.0641291737556458e-05, 1.4193356037139893e-05, 1.7745420336723328e-05, 2.1297484636306763e-05, 2.4849548935890198e-05, 2.8401613235473633e-05, 3.195367753505707e-05, 3.55057418346405e-05, 3.905780613422394e-05, 4.260987043380737e-05, 4.616193473339081e-05, 4.971399903297424e-05, 5.326606333255768e-05, 5.681812763214111e-05, 6.037019193172455e-05, 6.392225623130798e-05, 6.747432053089142e-05, 7.102638483047485e-05, 7.457844913005829e-05, 7.813051342964172e-05, 8.168257772922516e-05, 8.52346420288086e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 4.0, 13.0, 8.0, 20.0, 34.0, 40.0, 51.0, 71.0, 101.0, 159.0, 220.0, 361.0, 537.0, 922.0, 1819.0, 3688.0, 9116.0, 30644.0, 159637.0, 679870.0, 120699.0, 25332.0, 7899.0, 3240.0, 1640.0, 888.0, 488.0, 343.0, 205.0, 122.0, 98.0, 79.0, 48.0, 41.0, 25.0, 20.0, 16.0, 13.0, 11.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23432350158691406, -0.22731399536132812, -0.2203044891357422, -0.21329498291015625, -0.2062854766845703, -0.19927597045898438, -0.19226646423339844, -0.1852569580078125, -0.17824745178222656, -0.17123794555664062, -0.1642284393310547, -0.15721893310546875, -0.1502094268798828, -0.14319992065429688, -0.13619041442871094, -0.129180908203125, -0.12217140197753906, -0.11516189575195312, -0.10815238952636719, -0.10114288330078125, -0.09413337707519531, -0.08712387084960938, -0.08011436462402344, -0.0731048583984375, -0.06609535217285156, -0.059085845947265625, -0.05207633972167969, -0.04506683349609375, -0.03805732727050781, -0.031047821044921875, -0.024038314819335938, -0.01702880859375, -0.010019302368164062, -0.003009796142578125, 0.0039997100830078125, 0.01100921630859375, 0.018018722534179688, 0.025028228759765625, 0.03203773498535156, 0.0390472412109375, 0.04605674743652344, 0.053066253662109375, 0.06007575988769531, 0.06708526611328125, 0.07409477233886719, 0.08110427856445312, 0.08811378479003906, 0.095123291015625, 0.10213279724121094, 0.10914230346679688, 0.11615180969238281, 0.12316131591796875, 0.1301708221435547, 0.13718032836914062, 0.14418983459472656, 0.1511993408203125, 0.15820884704589844, 0.16521835327148438, 0.1722278594970703, 0.17923736572265625, 0.1862468719482422, 0.19325637817382812, 0.20026588439941406, 0.207275390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 9.0, 11.0, 7.0, 5.0, 9.0, 17.0, 25.0, 27.0, 31.0, 42.0, 44.0, 83.0, 75.0, 99.0, 85.0, 95.0, 87.0, 44.0, 39.0, 35.0, 30.0, 19.0, 13.0, 9.0, 9.0, 9.0, 6.0, 4.0, 9.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.27490234375, -0.26787757873535156, -0.2608528137207031, -0.2538280487060547, -0.24680328369140625, -0.2397785186767578, -0.23275375366210938, -0.22572898864746094, -0.2187042236328125, -0.21167945861816406, -0.20465469360351562, -0.1976299285888672, -0.19060516357421875, -0.1835803985595703, -0.17655563354492188, -0.16953086853027344, -0.162506103515625, -0.15548133850097656, -0.14845657348632812, -0.1414318084716797, -0.13440704345703125, -0.1273822784423828, -0.12035751342773438, -0.11333274841308594, -0.1063079833984375, -0.09928321838378906, -0.09225845336914062, -0.08523368835449219, -0.07820892333984375, -0.07118415832519531, -0.06415939331054688, -0.05713462829589844, -0.05010986328125, -0.04308509826660156, -0.036060333251953125, -0.029035568237304688, -0.02201080322265625, -0.014986038208007812, -0.007961273193359375, -0.0009365081787109375, 0.0060882568359375, 0.013113021850585938, 0.020137786865234375, 0.027162551879882812, 0.03418731689453125, 0.04121208190917969, 0.048236846923828125, 0.05526161193847656, 0.062286376953125, 0.06931114196777344, 0.07633590698242188, 0.08336067199707031, 0.09038543701171875, 0.09741020202636719, 0.10443496704101562, 0.11145973205566406, 0.1184844970703125, 0.12550926208496094, 0.13253402709960938, 0.1395587921142578, 0.14658355712890625, 0.1536083221435547, 0.16063308715820312, 0.16765785217285156, 0.1746826171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 6.0, 8.0, 17.0, 33.0, 76.0, 111.0, 183.0, 239.0, 135.0, 105.0, 41.0, 19.0, 9.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 5.0], "bins": [-8.287578582763672, -8.1261568069458, -7.9647345542907715, -7.803312301635742, -7.641890525817871, -7.48046875, -7.319046497344971, -7.157624244689941, -6.99620246887207, -6.834780693054199, -6.67335844039917, -6.511936187744141, -6.3505144119262695, -6.189092636108398, -6.027670383453369, -5.86624813079834, -5.704826354980469, -5.543404579162598, -5.381982326507568, -5.220560073852539, -5.059138298034668, -4.897716522216797, -4.736294269561768, -4.574872016906738, -4.413450241088867, -4.252028465270996, -4.090606212615967, -3.9291841983795166, -3.7677621841430664, -3.606340169906616, -3.444918155670166, -3.283496141433716, -3.122074604034424, -2.9606525897979736, -2.7992305755615234, -2.6378085613250732, -2.476386547088623, -2.314964532852173, -2.1535425186157227, -1.9921205043792725, -1.8306984901428223, -1.669276475906372, -1.5078544616699219, -1.3464324474334717, -1.1850104331970215, -1.0235884189605713, -0.8621664047241211, -0.7007443904876709, -0.5393223762512207, -0.3779003620147705, -0.2164783477783203, -0.05505633354187012, 0.10636568069458008, 0.2677876949310303, 0.42920970916748047, 0.5906317234039307, 0.7520537376403809, 0.913475751876831, 1.0748977661132812, 1.2363197803497314, 1.3977417945861816, 1.5591638088226318, 1.720585823059082, 1.8820078372955322, 2.0434298515319824]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 10.0, 15.0, 14.0, 22.0, 29.0, 22.0, 35.0, 38.0, 35.0, 35.0, 43.0, 45.0, 49.0, 59.0, 56.0, 48.0, 55.0, 30.0, 58.0, 41.0, 44.0, 35.0, 21.0, 26.0, 23.0, 15.0, 13.0, 13.0, 7.0, 8.0, 7.0, 6.0, 12.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6760222911834717, -2.6025078296661377, -2.5289933681488037, -2.4554789066314697, -2.3819644451141357, -2.3084499835968018, -2.2349355220794678, -2.161421060562134, -2.0879065990448, -2.014392137527466, -1.9408776760101318, -1.8673632144927979, -1.7938487529754639, -1.7203342914581299, -1.646819829940796, -1.573305368423462, -1.499790906906128, -1.426276445388794, -1.35276198387146, -1.279247522354126, -1.205733060836792, -1.132218599319458, -1.058704137802124, -0.98518967628479, -0.911675214767456, -0.8381607532501221, -0.7646462917327881, -0.6911318302154541, -0.6176173686981201, -0.5441029071807861, -0.47058844566345215, -0.39707398414611816, -0.3235592842102051, -0.2500448226928711, -0.1765303611755371, -0.10301589965820312, -0.02950143814086914, 0.044013023376464844, 0.11752748489379883, 0.1910419464111328, 0.2645564079284668, 0.3380708694458008, 0.41158533096313477, 0.48509979248046875, 0.5586142539978027, 0.6321287155151367, 0.7056431770324707, 0.7791576385498047, 0.8526721000671387, 0.9261865615844727, 0.9997010231018066, 1.0732154846191406, 1.1467299461364746, 1.2202444076538086, 1.2937588691711426, 1.3672733306884766, 1.4407877922058105, 1.5143022537231445, 1.5878167152404785, 1.6613311767578125, 1.7348456382751465, 1.8083600997924805, 1.8818745613098145, 1.9553890228271484, 2.0289034843444824]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 9.0, 6.0, 8.0, 7.0, 26.0, 21.0, 42.0, 52.0, 96.0, 124.0, 285.0, 1776.0, 207574.0, 3978296.0, 5127.0, 398.0, 163.0, 89.0, 57.0, 34.0, 23.0, 18.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5208740234375, -1.470458984375, -1.4200439453125, -1.36962890625, -1.3192138671875, -1.268798828125, -1.2183837890625, -1.16796875, -1.1175537109375, -1.067138671875, -1.0167236328125, -0.96630859375, -0.9158935546875, -0.865478515625, -0.8150634765625, -0.7646484375, -0.7142333984375, -0.663818359375, -0.6134033203125, -0.56298828125, -0.5125732421875, -0.462158203125, -0.4117431640625, -0.361328125, -0.3109130859375, -0.260498046875, -0.2100830078125, -0.15966796875, -0.1092529296875, -0.058837890625, -0.0084228515625, 0.0419921875, 0.0924072265625, 0.142822265625, 0.1932373046875, 0.24365234375, 0.2940673828125, 0.344482421875, 0.3948974609375, 0.4453125, 0.4957275390625, 0.546142578125, 0.5965576171875, 0.64697265625, 0.6973876953125, 0.747802734375, 0.7982177734375, 0.8486328125, 0.8990478515625, 0.949462890625, 0.9998779296875, 1.05029296875, 1.1007080078125, 1.151123046875, 1.2015380859375, 1.251953125, 1.3023681640625, 1.352783203125, 1.4031982421875, 1.45361328125, 1.5040283203125, 1.554443359375, 1.6048583984375, 1.6552734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 0.0, 4.0, 3.0, 5.0, 8.0, 13.0, 7.0, 11.0, 10.0, 23.0, 23.0, 19.0, 34.0, 27.0, 45.0, 40.0, 47.0, 45.0, 48.0, 53.0, 43.0, 47.0, 40.0, 50.0, 42.0, 43.0, 41.0, 30.0, 31.0, 32.0, 24.0, 14.0, 24.0, 18.0, 12.0, 15.0, 5.0, 8.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12139892578125, -0.11770820617675781, -0.11401748657226562, -0.11032676696777344, -0.10663604736328125, -0.10294532775878906, -0.09925460815429688, -0.09556388854980469, -0.0918731689453125, -0.08818244934082031, -0.08449172973632812, -0.08080101013183594, -0.07711029052734375, -0.07341957092285156, -0.06972885131835938, -0.06603813171386719, -0.062347412109375, -0.05865669250488281, -0.054965972900390625, -0.05127525329589844, -0.04758453369140625, -0.04389381408691406, -0.040203094482421875, -0.03651237487792969, -0.0328216552734375, -0.029130935668945312, -0.025440216064453125, -0.021749496459960938, -0.01805877685546875, -0.014368057250976562, -0.010677337646484375, -0.0069866180419921875, -0.0032958984375, 0.0003948211669921875, 0.004085540771484375, 0.0077762603759765625, 0.01146697998046875, 0.015157699584960938, 0.018848419189453125, 0.022539138793945312, 0.0262298583984375, 0.029920578002929688, 0.033611297607421875, 0.03730201721191406, 0.04099273681640625, 0.04468345642089844, 0.048374176025390625, 0.05206489562988281, 0.055755615234375, 0.05944633483886719, 0.06313705444335938, 0.06682777404785156, 0.07051849365234375, 0.07420921325683594, 0.07789993286132812, 0.08159065246582031, 0.0852813720703125, 0.08897209167480469, 0.09266281127929688, 0.09635353088378906, 0.10004425048828125, 0.10373497009277344, 0.10742568969726562, 0.11111640930175781, 0.11480712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 16.0, 19.0, 43.0, 70.0, 101.0, 185.0, 351.0, 674.0, 1463.0, 3237.0, 7645.0, 22158.0, 85202.0, 601673.0, 3026407.0, 352020.0, 63521.0, 18240.0, 6377.0, 2609.0, 1148.0, 525.0, 266.0, 126.0, 80.0, 41.0, 23.0, 21.0, 10.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.412841796875, -0.40149688720703125, -0.3901519775390625, -0.37880706787109375, -0.367462158203125, -0.35611724853515625, -0.3447723388671875, -0.33342742919921875, -0.32208251953125, -0.31073760986328125, -0.2993927001953125, -0.28804779052734375, -0.276702880859375, -0.26535797119140625, -0.2540130615234375, -0.24266815185546875, -0.2313232421875, -0.21997833251953125, -0.2086334228515625, -0.19728851318359375, -0.185943603515625, -0.17459869384765625, -0.1632537841796875, -0.15190887451171875, -0.14056396484375, -0.12921905517578125, -0.1178741455078125, -0.10652923583984375, -0.095184326171875, -0.08383941650390625, -0.0724945068359375, -0.06114959716796875, -0.0498046875, -0.03845977783203125, -0.0271148681640625, -0.01576995849609375, -0.004425048828125, 0.00691986083984375, 0.0182647705078125, 0.02960968017578125, 0.04095458984375, 0.05229949951171875, 0.0636444091796875, 0.07498931884765625, 0.086334228515625, 0.09767913818359375, 0.1090240478515625, 0.12036895751953125, 0.1317138671875, 0.14305877685546875, 0.1544036865234375, 0.16574859619140625, 0.177093505859375, 0.18843841552734375, 0.1997833251953125, 0.21112823486328125, 0.22247314453125, 0.23381805419921875, 0.2451629638671875, 0.25650787353515625, 0.267852783203125, 0.27919769287109375, 0.2905426025390625, 0.30188751220703125, 0.313232421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 5.0, 12.0, 7.0, 11.0, 17.0, 21.0, 37.0, 33.0, 56.0, 88.0, 141.0, 194.0, 300.0, 518.0, 702.0, 644.0, 437.0, 257.0, 159.0, 110.0, 74.0, 60.0, 39.0, 28.0, 18.0, 20.0, 13.0, 15.0, 18.0, 7.0, 6.0, 7.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.411376953125, -0.40019989013671875, -0.3890228271484375, -0.37784576416015625, -0.366668701171875, -0.35549163818359375, -0.3443145751953125, -0.33313751220703125, -0.32196044921875, -0.31078338623046875, -0.2996063232421875, -0.28842926025390625, -0.277252197265625, -0.26607513427734375, -0.2548980712890625, -0.24372100830078125, -0.2325439453125, -0.22136688232421875, -0.2101898193359375, -0.19901275634765625, -0.187835693359375, -0.17665863037109375, -0.1654815673828125, -0.15430450439453125, -0.14312744140625, -0.13195037841796875, -0.1207733154296875, -0.10959625244140625, -0.098419189453125, -0.08724212646484375, -0.0760650634765625, -0.06488800048828125, -0.0537109375, -0.04253387451171875, -0.0313568115234375, -0.02017974853515625, -0.009002685546875, 0.00217437744140625, 0.0133514404296875, 0.02452850341796875, 0.03570556640625, 0.04688262939453125, 0.0580596923828125, 0.06923675537109375, 0.080413818359375, 0.09159088134765625, 0.1027679443359375, 0.11394500732421875, 0.1251220703125, 0.13629913330078125, 0.1474761962890625, 0.15865325927734375, 0.169830322265625, 0.18100738525390625, 0.1921844482421875, 0.20336151123046875, 0.21453857421875, 0.22571563720703125, 0.2368927001953125, 0.24806976318359375, 0.259246826171875, 0.27042388916015625, 0.2816009521484375, 0.29277801513671875, 0.303955078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 24.0, 53.0, 102.0, 208.0, 232.0, 194.0, 91.0, 40.0, 14.0, 12.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.134166717529297, -4.979875564575195, -4.825584411621094, -4.67129373550415, -4.517002582550049, -4.362711429595947, -4.208420276641846, -4.054129600524902, -3.899838447570801, -3.745547294616699, -3.5912563800811768, -3.436965227127075, -3.2826743125915527, -3.128383159637451, -2.9740920066833496, -2.819801092147827, -2.6655099391937256, -2.511218786239624, -2.3569278717041016, -2.20263671875, -2.0483458042144775, -1.894054651260376, -1.739763617515564, -1.585472583770752, -1.43118155002594, -1.276890516281128, -1.122599482536316, -0.9683083891868591, -0.8140173554420471, -0.6597263216972351, -0.5054352283477783, -0.3511441946029663, -0.1968531608581543, -0.04256211221218109, 0.11172893643379211, 0.2660199999809265, 0.4203110337257385, 0.5746020674705505, 0.7288931608200073, 0.8831841945648193, 1.0374752283096313, 1.1917662620544434, 1.3460572957992554, 1.5003483295440674, 1.654639482498169, 1.8089303970336914, 1.963221549987793, 2.1175127029418945, 2.271803617477417, 2.4260947704315186, 2.580385684967041, 2.7346768379211426, 2.888967752456665, 3.0432589054107666, 3.197549819946289, 3.3518409729003906, 3.506132125854492, 3.6604232788085938, 3.814714193344116, 3.9690053462982178, 4.12329626083374, 4.277587413787842, 4.431878566741943, 4.586169242858887, 4.740460395812988]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 7.0, 8.0, 7.0, 5.0, 8.0, 12.0, 10.0, 13.0, 13.0, 28.0, 20.0, 25.0, 22.0, 36.0, 29.0, 25.0, 41.0, 30.0, 32.0, 46.0, 41.0, 38.0, 37.0, 38.0, 28.0, 29.0, 42.0, 38.0, 30.0, 28.0, 26.0, 25.0, 25.0, 18.0, 23.0, 17.0, 10.0, 15.0, 7.0, 10.0, 11.0, 6.0, 5.0, 9.0, 11.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.3456482887268066, -1.3037354946136475, -1.2618228197097778, -1.2199100255966187, -1.177997350692749, -1.1360845565795898, -1.0941717624664307, -1.052259087562561, -1.0103462934494019, -0.9684335589408875, -0.926520824432373, -0.8846080303192139, -0.8426952958106995, -0.8007825613021851, -0.7588698267936707, -0.7169570922851562, -0.6750443577766418, -0.6331316232681274, -0.591218888759613, -0.5493061542510986, -0.5073933601379395, -0.46548062562942505, -0.42356789112091064, -0.38165512681007385, -0.33974239230155945, -0.29782965779304504, -0.25591689348220825, -0.21400415897369385, -0.17209140956401825, -0.13017866015434265, -0.08826592564582825, -0.046353161334991455, -0.004440426826477051, 0.03747231885790825, 0.07938506454229355, 0.12129780650138855, 0.16321055591106415, 0.20512330532073975, 0.24703603982925415, 0.28894880414009094, 0.33086153864860535, 0.37277427315711975, 0.41468703746795654, 0.45659977197647095, 0.49851250648498535, 0.5404253005981445, 0.5823379755020142, 0.6242507696151733, 0.6661635041236877, 0.7080762386322021, 0.7499889731407166, 0.791901707649231, 0.8338145017623901, 0.8757272362709045, 0.917639970779419, 0.9595527648925781, 1.0014654397964478, 1.043378233909607, 1.0852909088134766, 1.1272037029266357, 1.1691163778305054, 1.2110291719436646, 1.2529418468475342, 1.2948546409606934, 1.3367674350738525]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 8.0, 8.0, 13.0, 14.0, 22.0, 25.0, 44.0, 55.0, 80.0, 142.0, 164.0, 251.0, 364.0, 488.0, 737.0, 1056.0, 1598.0, 2583.0, 4064.0, 6603.0, 11168.0, 20298.0, 39289.0, 94038.0, 274791.0, 354801.0, 127284.0, 50026.0, 24126.0, 13141.0, 7751.0, 4818.0, 2924.0, 1855.0, 1249.0, 805.0, 598.0, 361.0, 277.0, 195.0, 130.0, 84.0, 58.0, 39.0, 38.0, 20.0, 19.0, 15.0, 9.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.245361328125, -0.2381763458251953, -0.23099136352539062, -0.22380638122558594, -0.21662139892578125, -0.20943641662597656, -0.20225143432617188, -0.1950664520263672, -0.1878814697265625, -0.1806964874267578, -0.17351150512695312, -0.16632652282714844, -0.15914154052734375, -0.15195655822753906, -0.14477157592773438, -0.1375865936279297, -0.130401611328125, -0.12321662902832031, -0.11603164672851562, -0.10884666442871094, -0.10166168212890625, -0.09447669982910156, -0.08729171752929688, -0.08010673522949219, -0.0729217529296875, -0.06573677062988281, -0.058551788330078125, -0.05136680603027344, -0.04418182373046875, -0.03699684143066406, -0.029811859130859375, -0.022626876831054688, -0.01544189453125, -0.008256912231445312, -0.001071929931640625, 0.0061130523681640625, 0.01329803466796875, 0.020483016967773438, 0.027667999267578125, 0.03485298156738281, 0.0420379638671875, 0.04922294616699219, 0.056407928466796875, 0.06359291076660156, 0.07077789306640625, 0.07796287536621094, 0.08514785766601562, 0.09233283996582031, 0.099517822265625, 0.10670280456542969, 0.11388778686523438, 0.12107276916503906, 0.12825775146484375, 0.13544273376464844, 0.14262771606445312, 0.1498126983642578, 0.1569976806640625, 0.1641826629638672, 0.17136764526367188, 0.17855262756347656, 0.18573760986328125, 0.19292259216308594, 0.20010757446289062, 0.2072925567626953, 0.2144775390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 7.0, 11.0, 12.0, 15.0, 18.0, 29.0, 23.0, 27.0, 33.0, 31.0, 30.0, 42.0, 41.0, 38.0, 49.0, 45.0, 46.0, 44.0, 43.0, 43.0, 36.0, 49.0, 39.0, 21.0, 21.0, 29.0, 24.0, 30.0, 24.0, 21.0, 14.0, 13.0, 10.0, 4.0, 6.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11163330078125, -0.1077280044555664, -0.10382270812988281, -0.09991741180419922, -0.09601211547851562, -0.09210681915283203, -0.08820152282714844, -0.08429622650146484, -0.08039093017578125, -0.07648563385009766, -0.07258033752441406, -0.06867504119873047, -0.06476974487304688, -0.06086444854736328, -0.05695915222167969, -0.053053855895996094, -0.0491485595703125, -0.045243263244628906, -0.04133796691894531, -0.03743267059326172, -0.033527374267578125, -0.02962207794189453, -0.025716781616210938, -0.021811485290527344, -0.01790618896484375, -0.014000892639160156, -0.010095596313476562, -0.006190299987792969, -0.002285003662109375, 0.0016202926635742188, 0.0055255889892578125, 0.009430885314941406, 0.013336181640625, 0.017241477966308594, 0.021146774291992188, 0.02505207061767578, 0.028957366943359375, 0.03286266326904297, 0.03676795959472656, 0.040673255920410156, 0.04457855224609375, 0.048483848571777344, 0.05238914489746094, 0.05629444122314453, 0.060199737548828125, 0.06410503387451172, 0.06801033020019531, 0.0719156265258789, 0.0758209228515625, 0.0797262191772461, 0.08363151550292969, 0.08753681182861328, 0.09144210815429688, 0.09534740447998047, 0.09925270080566406, 0.10315799713134766, 0.10706329345703125, 0.11096858978271484, 0.11487388610839844, 0.11877918243408203, 0.12268447875976562, 0.12658977508544922, 0.1304950714111328, 0.1344003677368164, 0.1383056640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 13.0, 12.0, 12.0, 18.0, 18.0, 34.0, 47.0, 63.0, 83.0, 118.0, 200.0, 342.0, 528.0, 1004.0, 1938.0, 4640.0, 13609.0, 52593.0, 563770.0, 346834.0, 43197.0, 11394.0, 4044.0, 1681.0, 959.0, 487.0, 292.0, 183.0, 122.0, 86.0, 63.0, 42.0, 27.0, 25.0, 10.0, 14.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4655113220214844, -0.44884490966796875, -0.4321784973144531, -0.4155120849609375, -0.3988456726074219, -0.38217926025390625, -0.3655128479003906, -0.348846435546875, -0.3321800231933594, -0.31551361083984375, -0.2988471984863281, -0.2821807861328125, -0.2655143737792969, -0.24884796142578125, -0.23218154907226562, -0.21551513671875, -0.19884872436523438, -0.18218231201171875, -0.16551589965820312, -0.1488494873046875, -0.13218307495117188, -0.11551666259765625, -0.09885025024414062, -0.082183837890625, -0.06551742553710938, -0.04885101318359375, -0.032184600830078125, -0.0155181884765625, 0.001148223876953125, 0.01781463623046875, 0.034481048583984375, 0.0511474609375, 0.06781387329101562, 0.08448028564453125, 0.10114669799804688, 0.1178131103515625, 0.13447952270507812, 0.15114593505859375, 0.16781234741210938, 0.184478759765625, 0.20114517211914062, 0.21781158447265625, 0.23447799682617188, 0.2511444091796875, 0.2678108215332031, 0.28447723388671875, 0.3011436462402344, 0.31781005859375, 0.3344764709472656, 0.35114288330078125, 0.3678092956542969, 0.3844757080078125, 0.4011421203613281, 0.41780853271484375, 0.4344749450683594, 0.451141357421875, 0.4678077697753906, 0.48447418212890625, 0.5011405944824219, 0.5178070068359375, 0.5344734191894531, 0.5511398315429688, 0.5678062438964844, 0.58447265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 10.0, 6.0, 8.0, 10.0, 18.0, 15.0, 17.0, 31.0, 32.0, 40.0, 50.0, 53.0, 44.0, 50.0, 60.0, 56.0, 63.0, 43.0, 63.0, 31.0, 42.0, 42.0, 36.0, 35.0, 26.0, 23.0, 16.0, 17.0, 15.0, 11.0, 9.0, 7.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6650390625, -0.644622802734375, -0.62420654296875, -0.603790283203125, -0.5833740234375, -0.562957763671875, -0.54254150390625, -0.522125244140625, -0.501708984375, -0.481292724609375, -0.46087646484375, -0.440460205078125, -0.4200439453125, -0.399627685546875, -0.37921142578125, -0.358795166015625, -0.33837890625, -0.317962646484375, -0.29754638671875, -0.277130126953125, -0.2567138671875, -0.236297607421875, -0.21588134765625, -0.195465087890625, -0.175048828125, -0.154632568359375, -0.13421630859375, -0.113800048828125, -0.0933837890625, -0.072967529296875, -0.05255126953125, -0.032135009765625, -0.01171875, 0.008697509765625, 0.02911376953125, 0.049530029296875, 0.0699462890625, 0.090362548828125, 0.11077880859375, 0.131195068359375, 0.151611328125, 0.172027587890625, 0.19244384765625, 0.212860107421875, 0.2332763671875, 0.253692626953125, 0.27410888671875, 0.294525146484375, 0.31494140625, 0.335357666015625, 0.35577392578125, 0.376190185546875, 0.3966064453125, 0.417022705078125, 0.43743896484375, 0.457855224609375, 0.478271484375, 0.498687744140625, 0.51910400390625, 0.539520263671875, 0.5599365234375, 0.580352783203125, 0.60076904296875, 0.621185302734375, 0.6416015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 12.0, 9.0, 14.0, 19.0, 28.0, 41.0, 69.0, 130.0, 304.0, 784.0, 3050.0, 20099.0, 372471.0, 621624.0, 24686.0, 3626.0, 920.0, 326.0, 135.0, 70.0, 43.0, 28.0, 17.0, 12.0, 8.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361328125, -0.3474578857421875, -0.333587646484375, -0.3197174072265625, -0.30584716796875, -0.2919769287109375, -0.278106689453125, -0.2642364501953125, -0.2503662109375, -0.2364959716796875, -0.222625732421875, -0.2087554931640625, -0.19488525390625, -0.1810150146484375, -0.167144775390625, -0.1532745361328125, -0.139404296875, -0.1255340576171875, -0.111663818359375, -0.0977935791015625, -0.08392333984375, -0.0700531005859375, -0.056182861328125, -0.0423126220703125, -0.0284423828125, -0.0145721435546875, -0.000701904296875, 0.0131683349609375, 0.02703857421875, 0.0409088134765625, 0.054779052734375, 0.0686492919921875, 0.08251953125, 0.0963897705078125, 0.110260009765625, 0.1241302490234375, 0.13800048828125, 0.1518707275390625, 0.165740966796875, 0.1796112060546875, 0.1934814453125, 0.2073516845703125, 0.221221923828125, 0.2350921630859375, 0.24896240234375, 0.2628326416015625, 0.276702880859375, 0.2905731201171875, 0.304443359375, 0.3183135986328125, 0.332183837890625, 0.3460540771484375, 0.35992431640625, 0.3737945556640625, 0.387664794921875, 0.4015350341796875, 0.4154052734375, 0.4292755126953125, 0.443145751953125, 0.4570159912109375, 0.47088623046875, 0.4847564697265625, 0.498626708984375, 0.5124969482421875, 0.5263671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 10.0, 9.0, 13.0, 11.0, 23.0, 19.0, 32.0, 46.0, 41.0, 76.0, 85.0, 105.0, 84.0, 100.0, 65.0, 55.0, 55.0, 26.0, 27.0, 16.0, 14.0, 9.0, 13.0, 10.0, 5.0, 5.0, 2.0, 3.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.557868957519531e-05, -7.329694926738739e-05, -7.101520895957947e-05, -6.873346865177155e-05, -6.645172834396362e-05, -6.41699880361557e-05, -6.188824772834778e-05, -5.9606507420539856e-05, -5.7324767112731934e-05, -5.504302680492401e-05, -5.276128649711609e-05, -5.0479546189308167e-05, -4.8197805881500244e-05, -4.591606557369232e-05, -4.36343252658844e-05, -4.135258495807648e-05, -3.9070844650268555e-05, -3.678910434246063e-05, -3.450736403465271e-05, -3.222562372684479e-05, -2.9943883419036865e-05, -2.7662143111228943e-05, -2.538040280342102e-05, -2.3098662495613098e-05, -2.0816922187805176e-05, -1.8535181879997253e-05, -1.625344157218933e-05, -1.3971701264381409e-05, -1.1689960956573486e-05, -9.408220648765564e-06, -7.126480340957642e-06, -4.844740033149719e-06, -2.562999725341797e-06, -2.812594175338745e-07, 2.000480890274048e-06, 4.28222119808197e-06, 6.563961505889893e-06, 8.845701813697815e-06, 1.1127442121505737e-05, 1.340918242931366e-05, 1.5690922737121582e-05, 1.7972663044929504e-05, 2.0254403352737427e-05, 2.253614366054535e-05, 2.481788396835327e-05, 2.7099624276161194e-05, 2.9381364583969116e-05, 3.166310489177704e-05, 3.394484519958496e-05, 3.622658550739288e-05, 3.8508325815200806e-05, 4.079006612300873e-05, 4.307180643081665e-05, 4.535354673862457e-05, 4.7635287046432495e-05, 4.991702735424042e-05, 5.219876766204834e-05, 5.448050796985626e-05, 5.6762248277664185e-05, 5.904398858547211e-05, 6.132572889328003e-05, 6.360746920108795e-05, 6.588920950889587e-05, 6.81709498167038e-05, 7.045269012451172e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 6.0, 8.0, 14.0, 25.0, 40.0, 49.0, 64.0, 124.0, 218.0, 524.0, 1144.0, 2943.0, 9826.0, 68873.0, 836388.0, 109679.0, 12603.0, 3509.0, 1349.0, 553.0, 247.0, 144.0, 78.0, 45.0, 37.0, 25.0, 8.0, 5.0, 2.0, 9.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.367431640625, -0.35457611083984375, -0.3417205810546875, -0.32886505126953125, -0.316009521484375, -0.30315399169921875, -0.2902984619140625, -0.27744293212890625, -0.26458740234375, -0.25173187255859375, -0.2388763427734375, -0.22602081298828125, -0.213165283203125, -0.20030975341796875, -0.1874542236328125, -0.17459869384765625, -0.1617431640625, -0.14888763427734375, -0.1360321044921875, -0.12317657470703125, -0.110321044921875, -0.09746551513671875, -0.0846099853515625, -0.07175445556640625, -0.05889892578125, -0.04604339599609375, -0.0331878662109375, -0.02033233642578125, -0.007476806640625, 0.00537872314453125, 0.0182342529296875, 0.03108978271484375, 0.0439453125, 0.05680084228515625, 0.0696563720703125, 0.08251190185546875, 0.095367431640625, 0.10822296142578125, 0.1210784912109375, 0.13393402099609375, 0.14678955078125, 0.15964508056640625, 0.1725006103515625, 0.18535614013671875, 0.198211669921875, 0.21106719970703125, 0.2239227294921875, 0.23677825927734375, 0.2496337890625, 0.26248931884765625, 0.2753448486328125, 0.28820037841796875, 0.301055908203125, 0.31391143798828125, 0.3267669677734375, 0.33962249755859375, 0.35247802734375, 0.36533355712890625, 0.3781890869140625, 0.39104461669921875, 0.403900146484375, 0.41675567626953125, 0.4296112060546875, 0.44246673583984375, 0.455322265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 21.0, 10.0, 25.0, 29.0, 42.0, 50.0, 54.0, 72.0, 85.0, 100.0, 86.0, 73.0, 65.0, 49.0, 53.0, 35.0, 27.0, 18.0, 12.0, 16.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.260009765625, -0.25267601013183594, -0.24534225463867188, -0.2380084991455078, -0.23067474365234375, -0.2233409881591797, -0.21600723266601562, -0.20867347717285156, -0.2013397216796875, -0.19400596618652344, -0.18667221069335938, -0.1793384552001953, -0.17200469970703125, -0.1646709442138672, -0.15733718872070312, -0.15000343322753906, -0.142669677734375, -0.13533592224121094, -0.12800216674804688, -0.12066841125488281, -0.11333465576171875, -0.10600090026855469, -0.09866714477539062, -0.09133338928222656, -0.0839996337890625, -0.07666587829589844, -0.06933212280273438, -0.06199836730957031, -0.05466461181640625, -0.04733085632324219, -0.039997100830078125, -0.03266334533691406, -0.02532958984375, -0.017995834350585938, -0.010662078857421875, -0.0033283233642578125, 0.00400543212890625, 0.011339187622070312, 0.018672943115234375, 0.026006698608398438, 0.0333404541015625, 0.04067420959472656, 0.048007965087890625, 0.05534172058105469, 0.06267547607421875, 0.07000923156738281, 0.07734298706054688, 0.08467674255371094, 0.092010498046875, 0.09934425354003906, 0.10667800903320312, 0.11401176452636719, 0.12134552001953125, 0.1286792755126953, 0.13601303100585938, 0.14334678649902344, 0.1506805419921875, 0.15801429748535156, 0.16534805297851562, 0.1726818084716797, 0.18001556396484375, 0.1873493194580078, 0.19468307495117188, 0.20201683044433594, 0.2093505859375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 27.0, 62.0, 119.0, 264.0, 256.0, 139.0, 63.0, 18.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.128609657287598, -3.9339144229888916, -3.7392191886901855, -3.5445239543914795, -3.3498287200927734, -3.1551334857940674, -2.9604382514953613, -2.7657430171966553, -2.571047782897949, -2.376352548599243, -2.181657314300537, -1.986962080001831, -1.792266845703125, -1.597571611404419, -1.402876377105713, -1.2081811428070068, -1.0134859085083008, -0.8187906742095947, -0.6240954399108887, -0.4294002056121826, -0.23470497131347656, -0.04000973701477051, 0.15468549728393555, 0.3493807315826416, 0.5440759658813477, 0.7387712001800537, 0.9334664344787598, 1.1281616687774658, 1.3228569030761719, 1.517552137374878, 1.712247371673584, 1.90694260597229, 2.101637840270996, 2.296333074569702, 2.491028308868408, 2.6857235431671143, 2.8804187774658203, 3.0751140117645264, 3.2698092460632324, 3.4645044803619385, 3.6591997146606445, 3.8538949489593506, 4.048590183258057, 4.243285179138184, 4.437980651855469, 4.632676124572754, 4.827371120452881, 5.022066116333008, 5.216761589050293, 5.411457061767578, 5.606152057647705, 5.800847053527832, 5.995542526245117, 6.190237998962402, 6.384932994842529, 6.579627990722656, 6.774323463439941, 6.969018936157227, 7.1637139320373535, 7.3584089279174805, 7.553104400634766, 7.747799873352051, 7.942494869232178, 8.137189865112305, 8.33188533782959]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 13.0, 13.0, 10.0, 16.0, 14.0, 17.0, 18.0, 20.0, 26.0, 33.0, 39.0, 42.0, 30.0, 46.0, 52.0, 69.0, 71.0, 75.0, 62.0, 37.0, 40.0, 42.0, 36.0, 30.0, 25.0, 27.0, 23.0, 10.0, 15.0, 7.0, 16.0, 11.0, 2.0, 3.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73716139793396, -2.6523704528808594, -2.5675792694091797, -2.4827880859375, -2.3979971408843994, -2.313206195831299, -2.228415012359619, -2.1436238288879395, -2.058832883834839, -1.9740418195724487, -1.8892507553100586, -1.8044596910476685, -1.7196686267852783, -1.6348775625228882, -1.550086498260498, -1.465295433998108, -1.3805043697357178, -1.2957133054733276, -1.2109222412109375, -1.1261311769485474, -1.0413401126861572, -0.9565490484237671, -0.871757984161377, -0.7869669198989868, -0.7021758556365967, -0.6173847913742065, -0.5325937271118164, -0.44780266284942627, -0.36301159858703613, -0.278220534324646, -0.19342947006225586, -0.10863840579986572, -0.023847579956054688, 0.06094348430633545, 0.14573454856872559, 0.23052561283111572, 0.31531667709350586, 0.400107741355896, 0.48489880561828613, 0.5696898698806763, 0.6544809341430664, 0.7392719984054565, 0.8240630626678467, 0.9088541269302368, 0.993645191192627, 1.078436255455017, 1.1632273197174072, 1.2480183839797974, 1.3328094482421875, 1.4176005125045776, 1.5023915767669678, 1.587182641029358, 1.671973705291748, 1.7567647695541382, 1.8415558338165283, 1.9263468980789185, 2.0111379623413086, 2.0959291458129883, 2.180720090866089, 2.2655110359191895, 2.350302219390869, 2.435093402862549, 2.5198843479156494, 2.60467529296875, 2.6894664764404297]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 10.0, 5.0, 5.0, 8.0, 8.0, 18.0, 18.0, 39.0, 42.0, 87.0, 175.0, 346.0, 764.0, 1654.0, 3947.0, 10492.0, 30552.0, 110568.0, 638063.0, 2546574.0, 683440.0, 117942.0, 32015.0, 10520.0, 3939.0, 1605.0, 676.0, 325.0, 201.0, 88.0, 52.0, 38.0, 25.0, 18.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.31201171875, -0.3039112091064453, -0.2958106994628906, -0.28771018981933594, -0.27960968017578125, -0.27150917053222656, -0.2634086608886719, -0.2553081512451172, -0.2472076416015625, -0.2391071319580078, -0.23100662231445312, -0.22290611267089844, -0.21480560302734375, -0.20670509338378906, -0.19860458374023438, -0.1905040740966797, -0.182403564453125, -0.1743030548095703, -0.16620254516601562, -0.15810203552246094, -0.15000152587890625, -0.14190101623535156, -0.13380050659179688, -0.1256999969482422, -0.1175994873046875, -0.10949897766113281, -0.10139846801757812, -0.09329795837402344, -0.08519744873046875, -0.07709693908691406, -0.06899642944335938, -0.06089591979980469, -0.05279541015625, -0.04469490051269531, -0.036594390869140625, -0.028493881225585938, -0.02039337158203125, -0.012292861938476562, -0.004192352294921875, 0.0039081573486328125, 0.0120086669921875, 0.020109176635742188, 0.028209686279296875, 0.03631019592285156, 0.04441070556640625, 0.05251121520996094, 0.060611724853515625, 0.06871223449707031, 0.076812744140625, 0.08491325378417969, 0.09301376342773438, 0.10111427307128906, 0.10921478271484375, 0.11731529235839844, 0.12541580200195312, 0.1335163116455078, 0.1416168212890625, 0.1497173309326172, 0.15781784057617188, 0.16591835021972656, 0.17401885986328125, 0.18211936950683594, 0.19021987915039062, 0.1983203887939453, 0.2064208984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 7.0, 9.0, 17.0, 10.0, 16.0, 34.0, 20.0, 22.0, 23.0, 34.0, 28.0, 39.0, 35.0, 49.0, 52.0, 40.0, 58.0, 45.0, 55.0, 33.0, 43.0, 54.0, 36.0, 35.0, 28.0, 21.0, 21.0, 27.0, 19.0, 18.0, 8.0, 13.0, 10.0, 4.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1265869140625, -0.1228036880493164, -0.11902046203613281, -0.11523723602294922, -0.11145401000976562, -0.10767078399658203, -0.10388755798339844, -0.10010433197021484, -0.09632110595703125, -0.09253787994384766, -0.08875465393066406, -0.08497142791748047, -0.08118820190429688, -0.07740497589111328, -0.07362174987792969, -0.0698385238647461, -0.0660552978515625, -0.062272071838378906, -0.05848884582519531, -0.05470561981201172, -0.050922393798828125, -0.04713916778564453, -0.04335594177246094, -0.039572715759277344, -0.03578948974609375, -0.032006263732910156, -0.028223037719726562, -0.02443981170654297, -0.020656585693359375, -0.01687335968017578, -0.013090133666992188, -0.009306907653808594, -0.005523681640625, -0.0017404556274414062, 0.0020427703857421875, 0.005825996398925781, 0.009609222412109375, 0.013392448425292969, 0.017175674438476562, 0.020958900451660156, 0.02474212646484375, 0.028525352478027344, 0.03230857849121094, 0.03609180450439453, 0.039875030517578125, 0.04365825653076172, 0.04744148254394531, 0.051224708557128906, 0.0550079345703125, 0.058791160583496094, 0.06257438659667969, 0.06635761260986328, 0.07014083862304688, 0.07392406463623047, 0.07770729064941406, 0.08149051666259766, 0.08527374267578125, 0.08905696868896484, 0.09284019470214844, 0.09662342071533203, 0.10040664672851562, 0.10418987274169922, 0.10797309875488281, 0.1117563247680664, 0.11553955078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 5.0, 5.0, 5.0, 6.0, 17.0, 23.0, 44.0, 57.0, 56.0, 112.0, 180.0, 309.0, 503.0, 913.0, 1635.0, 3435.0, 7938.0, 19511.0, 55943.0, 189594.0, 945082.0, 2281870.0, 498104.0, 123345.0, 39321.0, 14650.0, 5832.0, 2706.0, 1316.0, 697.0, 404.0, 238.0, 147.0, 88.0, 66.0, 42.0, 25.0, 16.0, 14.0, 7.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2408447265625, -0.23262977600097656, -0.22441482543945312, -0.2161998748779297, -0.20798492431640625, -0.1997699737548828, -0.19155502319335938, -0.18334007263183594, -0.1751251220703125, -0.16691017150878906, -0.15869522094726562, -0.1504802703857422, -0.14226531982421875, -0.1340503692626953, -0.12583541870117188, -0.11762046813964844, -0.109405517578125, -0.10119056701660156, -0.09297561645507812, -0.08476066589355469, -0.07654571533203125, -0.06833076477050781, -0.060115814208984375, -0.05190086364746094, -0.0436859130859375, -0.03547096252441406, -0.027256011962890625, -0.019041061401367188, -0.01082611083984375, -0.0026111602783203125, 0.005603790283203125, 0.013818740844726562, 0.02203369140625, 0.030248641967773438, 0.038463592529296875, 0.04667854309082031, 0.05489349365234375, 0.06310844421386719, 0.07132339477539062, 0.07953834533691406, 0.0877532958984375, 0.09596824645996094, 0.10418319702148438, 0.11239814758300781, 0.12061309814453125, 0.1288280487060547, 0.13704299926757812, 0.14525794982910156, 0.153472900390625, 0.16168785095214844, 0.16990280151367188, 0.1781177520751953, 0.18633270263671875, 0.1945476531982422, 0.20276260375976562, 0.21097755432128906, 0.2191925048828125, 0.22740745544433594, 0.23562240600585938, 0.2438373565673828, 0.25205230712890625, 0.2602672576904297, 0.2684822082519531, 0.27669715881347656, 0.284912109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 13.0, 10.0, 13.0, 23.0, 29.0, 43.0, 61.0, 70.0, 80.0, 142.0, 129.0, 201.0, 356.0, 483.0, 502.0, 455.0, 356.0, 273.0, 197.0, 124.0, 108.0, 101.0, 78.0, 57.0, 52.0, 23.0, 16.0, 18.0, 14.0, 10.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4091796875, -0.3977394104003906, -0.38629913330078125, -0.3748588562011719, -0.3634185791015625, -0.3519783020019531, -0.34053802490234375, -0.3290977478027344, -0.317657470703125, -0.3062171936035156, -0.29477691650390625, -0.2833366394042969, -0.2718963623046875, -0.2604560852050781, -0.24901580810546875, -0.23757553100585938, -0.22613525390625, -0.21469497680664062, -0.20325469970703125, -0.19181442260742188, -0.1803741455078125, -0.16893386840820312, -0.15749359130859375, -0.14605331420898438, -0.134613037109375, -0.12317276000976562, -0.11173248291015625, -0.10029220581054688, -0.0888519287109375, -0.07741165161132812, -0.06597137451171875, -0.054531097412109375, -0.0430908203125, -0.031650543212890625, -0.02021026611328125, -0.008769989013671875, 0.0026702880859375, 0.014110565185546875, 0.02555084228515625, 0.036991119384765625, 0.048431396484375, 0.059871673583984375, 0.07131195068359375, 0.08275222778320312, 0.0941925048828125, 0.10563278198242188, 0.11707305908203125, 0.12851333618164062, 0.13995361328125, 0.15139389038085938, 0.16283416748046875, 0.17427444458007812, 0.1857147216796875, 0.19715499877929688, 0.20859527587890625, 0.22003555297851562, 0.231475830078125, 0.24291610717773438, 0.25435638427734375, 0.2657966613769531, 0.2772369384765625, 0.2886772155761719, 0.30011749267578125, 0.3115577697753906, 0.322998046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 7.0, 19.0, 51.0, 107.0, 181.0, 220.0, 211.0, 105.0, 37.0, 18.0, 11.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.286144733428955, -4.109877586364746, -3.933610439300537, -3.7573435306549072, -3.5810763835906982, -3.4048092365264893, -3.2285423278808594, -3.0522751808166504, -2.8760080337524414, -2.6997408866882324, -2.5234737396240234, -2.3472068309783936, -2.1709396839141846, -1.9946725368499756, -1.8184055089950562, -1.6421384811401367, -1.4658713340759277, -1.2896041870117188, -1.1133371591567993, -0.9370700716972351, -0.7608029842376709, -0.5845358967781067, -0.4082688093185425, -0.23200178146362305, -0.05573463439941406, 0.12053245306015015, 0.29679954051971436, 0.47306662797927856, 0.6493337154388428, 0.825600802898407, 1.0018678903579712, 1.1781349182128906, 1.3544015884399414, 1.5306687355041504, 1.7069357633590698, 1.8832027912139893, 2.0594699382781982, 2.2357370853424072, 2.412003993988037, 2.588271141052246, 2.764538288116455, 2.940805435180664, 3.117072582244873, 3.293339490890503, 3.469606637954712, 3.645873785018921, 3.822140693664551, 3.9984078407287598, 4.174674987792969, 4.350942134857178, 4.527209281921387, 4.703476428985596, 4.879743576049805, 5.0560102462768555, 5.2322773933410645, 5.408544540405273, 5.584811687469482, 5.761078834533691, 5.9373459815979, 6.113613128662109, 6.28987979888916, 6.466146945953369, 6.642414093017578, 6.818681240081787, 6.994948387145996]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 1.0, 7.0, 10.0, 13.0, 11.0, 15.0, 18.0, 12.0, 17.0, 25.0, 34.0, 26.0, 33.0, 45.0, 50.0, 53.0, 51.0, 42.0, 47.0, 40.0, 43.0, 47.0, 46.0, 47.0, 30.0, 38.0, 30.0, 24.0, 26.0, 21.0, 22.0, 13.0, 16.0, 8.0, 12.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.864199161529541, -1.7974910736083984, -1.7307828664779663, -1.6640747785568237, -1.5973665714263916, -1.530658483505249, -1.4639503955841064, -1.3972423076629639, -1.3305341005325317, -1.2638260126113892, -1.197117805480957, -1.1304097175598145, -1.0637016296386719, -0.9969934225082397, -0.9302853345870972, -0.8635771870613098, -0.7968690395355225, -0.7301608920097351, -0.6634527444839478, -0.5967446565628052, -0.5300365090370178, -0.46332836151123047, -0.3966202437877655, -0.32991212606430054, -0.2632039785385132, -0.19649584591388702, -0.12978771328926086, -0.0630795806646347, 0.003628551959991455, 0.07033669948577881, 0.13704481720924377, 0.20375293493270874, 0.2704613208770752, 0.33716946840286255, 0.4038775861263275, 0.4705857038497925, 0.5372938513755798, 0.6040019989013672, 0.6707100868225098, 0.7374182343482971, 0.8041263818740845, 0.8708345293998718, 0.9375426769256592, 1.0042507648468018, 1.0709588527679443, 1.1376670598983765, 1.204375147819519, 1.2710833549499512, 1.3377914428710938, 1.4044995307922363, 1.4712077379226685, 1.537915825843811, 1.6046240329742432, 1.6713321208953857, 1.7380402088165283, 1.804748296737671, 1.871456503868103, 1.9381645917892456, 2.0048727989196777, 2.0715808868408203, 2.138288974761963, 2.2049970626831055, 2.271705389022827, 2.3384134769439697, 2.4051215648651123]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 8.0, 13.0, 11.0, 16.0, 26.0, 28.0, 46.0, 56.0, 97.0, 159.0, 235.0, 372.0, 616.0, 963.0, 1620.0, 2718.0, 5015.0, 9445.0, 17996.0, 36195.0, 76643.0, 190889.0, 375772.0, 182215.0, 74294.0, 35131.0, 17456.0, 8969.0, 4851.0, 2662.0, 1591.0, 896.0, 576.0, 349.0, 218.0, 133.0, 86.0, 60.0, 39.0, 25.0, 22.0, 12.0, 14.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3076171875, -0.2986946105957031, -0.28977203369140625, -0.2808494567871094, -0.2719268798828125, -0.2630043029785156, -0.25408172607421875, -0.24515914916992188, -0.236236572265625, -0.22731399536132812, -0.21839141845703125, -0.20946884155273438, -0.2005462646484375, -0.19162368774414062, -0.18270111083984375, -0.17377853393554688, -0.16485595703125, -0.15593338012695312, -0.14701080322265625, -0.13808822631835938, -0.1291656494140625, -0.12024307250976562, -0.11132049560546875, -0.10239791870117188, -0.093475341796875, -0.08455276489257812, -0.07563018798828125, -0.06670761108398438, -0.0577850341796875, -0.048862457275390625, -0.03993988037109375, -0.031017303466796875, -0.0220947265625, -0.013172149658203125, -0.00424957275390625, 0.004673004150390625, 0.0135955810546875, 0.022518157958984375, 0.03144073486328125, 0.040363311767578125, 0.049285888671875, 0.058208465576171875, 0.06713104248046875, 0.07605361938476562, 0.0849761962890625, 0.09389877319335938, 0.10282135009765625, 0.11174392700195312, 0.12066650390625, 0.12958908081054688, 0.13851165771484375, 0.14743423461914062, 0.1563568115234375, 0.16527938842773438, 0.17420196533203125, 0.18312454223632812, 0.192047119140625, 0.20096969604492188, 0.20989227294921875, 0.21881484985351562, 0.2277374267578125, 0.23666000366210938, 0.24558258056640625, 0.2545051574707031, 0.263427734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 14.0, 13.0, 11.0, 15.0, 20.0, 20.0, 35.0, 25.0, 34.0, 51.0, 49.0, 45.0, 65.0, 60.0, 65.0, 57.0, 56.0, 59.0, 51.0, 47.0, 41.0, 33.0, 17.0, 35.0, 20.0, 15.0, 13.0, 13.0, 4.0, 4.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1584949493408203, -0.15329360961914062, -0.14809226989746094, -0.14289093017578125, -0.13768959045410156, -0.13248825073242188, -0.1272869110107422, -0.1220855712890625, -0.11688423156738281, -0.11168289184570312, -0.10648155212402344, -0.10128021240234375, -0.09607887268066406, -0.09087753295898438, -0.08567619323730469, -0.080474853515625, -0.07527351379394531, -0.07007217407226562, -0.06487083435058594, -0.05966949462890625, -0.05446815490722656, -0.049266815185546875, -0.04406547546386719, -0.0388641357421875, -0.03366279602050781, -0.028461456298828125, -0.023260116577148438, -0.01805877685546875, -0.012857437133789062, -0.007656097412109375, -0.0024547576904296875, 0.00274658203125, 0.007947921752929688, 0.013149261474609375, 0.018350601196289062, 0.02355194091796875, 0.028753280639648438, 0.033954620361328125, 0.03915596008300781, 0.0443572998046875, 0.04955863952636719, 0.054759979248046875, 0.05996131896972656, 0.06516265869140625, 0.07036399841308594, 0.07556533813476562, 0.08076667785644531, 0.085968017578125, 0.09116935729980469, 0.09637069702148438, 0.10157203674316406, 0.10677337646484375, 0.11197471618652344, 0.11717605590820312, 0.12237739562988281, 0.1275787353515625, 0.1327800750732422, 0.13798141479492188, 0.14318275451660156, 0.14838409423828125, 0.15358543395996094, 0.15878677368164062, 0.1639881134033203, 0.169189453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 4.0, 15.0, 11.0, 13.0, 21.0, 31.0, 34.0, 42.0, 51.0, 70.0, 109.0, 142.0, 213.0, 291.0, 461.0, 699.0, 1162.0, 1968.0, 4022.0, 10363.0, 38459.0, 256636.0, 641945.0, 65302.0, 14918.0, 5232.0, 2453.0, 1335.0, 767.0, 536.0, 357.0, 248.0, 167.0, 133.0, 94.0, 59.0, 51.0, 38.0, 27.0, 13.0, 12.0, 11.0, 5.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.6259765625, -0.6058883666992188, -0.5858001708984375, -0.5657119750976562, -0.545623779296875, -0.5255355834960938, -0.5054473876953125, -0.48535919189453125, -0.46527099609375, -0.44518280029296875, -0.4250946044921875, -0.40500640869140625, -0.384918212890625, -0.36483001708984375, -0.3447418212890625, -0.32465362548828125, -0.3045654296875, -0.28447723388671875, -0.2643890380859375, -0.24430084228515625, -0.224212646484375, -0.20412445068359375, -0.1840362548828125, -0.16394805908203125, -0.14385986328125, -0.12377166748046875, -0.1036834716796875, -0.08359527587890625, -0.063507080078125, -0.04341888427734375, -0.0233306884765625, -0.00324249267578125, 0.016845703125, 0.03693389892578125, 0.0570220947265625, 0.07711029052734375, 0.097198486328125, 0.11728668212890625, 0.1373748779296875, 0.15746307373046875, 0.17755126953125, 0.19763946533203125, 0.2177276611328125, 0.23781585693359375, 0.257904052734375, 0.27799224853515625, 0.2980804443359375, 0.31816864013671875, 0.3382568359375, 0.35834503173828125, 0.3784332275390625, 0.39852142333984375, 0.418609619140625, 0.43869781494140625, 0.4587860107421875, 0.47887420654296875, 0.49896240234375, 0.5190505981445312, 0.5391387939453125, 0.5592269897460938, 0.579315185546875, 0.5994033813476562, 0.6194915771484375, 0.6395797729492188, 0.65966796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 8.0, 6.0, 18.0, 14.0, 12.0, 16.0, 20.0, 25.0, 26.0, 34.0, 28.0, 21.0, 33.0, 53.0, 53.0, 57.0, 40.0, 49.0, 46.0, 55.0, 50.0, 40.0, 48.0, 39.0, 24.0, 24.0, 28.0, 22.0, 17.0, 11.0, 17.0, 14.0, 9.0, 10.0, 7.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5840911865234375, -0.563201904296875, -0.5423126220703125, -0.52142333984375, -0.5005340576171875, -0.479644775390625, -0.4587554931640625, -0.4378662109375, -0.4169769287109375, -0.396087646484375, -0.3751983642578125, -0.35430908203125, -0.3334197998046875, -0.312530517578125, -0.2916412353515625, -0.270751953125, -0.2498626708984375, -0.228973388671875, -0.2080841064453125, -0.18719482421875, -0.1663055419921875, -0.145416259765625, -0.1245269775390625, -0.1036376953125, -0.0827484130859375, -0.061859130859375, -0.0409698486328125, -0.02008056640625, 0.0008087158203125, 0.021697998046875, 0.0425872802734375, 0.0634765625, 0.0843658447265625, 0.105255126953125, 0.1261444091796875, 0.14703369140625, 0.1679229736328125, 0.188812255859375, 0.2097015380859375, 0.2305908203125, 0.2514801025390625, 0.272369384765625, 0.2932586669921875, 0.31414794921875, 0.3350372314453125, 0.355926513671875, 0.3768157958984375, 0.397705078125, 0.4185943603515625, 0.439483642578125, 0.4603729248046875, 0.48126220703125, 0.5021514892578125, 0.523040771484375, 0.5439300537109375, 0.5648193359375, 0.5857086181640625, 0.606597900390625, 0.6274871826171875, 0.64837646484375, 0.6692657470703125, 0.690155029296875, 0.7110443115234375, 0.73193359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 8.0, 12.0, 23.0, 28.0, 40.0, 29.0, 63.0, 78.0, 123.0, 224.0, 304.0, 508.0, 884.0, 1759.0, 3947.0, 10376.0, 32241.0, 125353.0, 637810.0, 170847.0, 41538.0, 12740.0, 4769.0, 2147.0, 1141.0, 547.0, 319.0, 207.0, 112.0, 98.0, 75.0, 46.0, 39.0, 19.0, 20.0, 15.0, 13.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 2.0, 3.0], "bins": [-0.2335205078125, -0.2269611358642578, -0.22040176391601562, -0.21384239196777344, -0.20728302001953125, -0.20072364807128906, -0.19416427612304688, -0.1876049041748047, -0.1810455322265625, -0.1744861602783203, -0.16792678833007812, -0.16136741638183594, -0.15480804443359375, -0.14824867248535156, -0.14168930053710938, -0.1351299285888672, -0.128570556640625, -0.12201118469238281, -0.11545181274414062, -0.10889244079589844, -0.10233306884765625, -0.09577369689941406, -0.08921432495117188, -0.08265495300292969, -0.0760955810546875, -0.06953620910644531, -0.06297683715820312, -0.05641746520996094, -0.04985809326171875, -0.04329872131347656, -0.036739349365234375, -0.030179977416992188, -0.02362060546875, -0.017061233520507812, -0.010501861572265625, -0.0039424896240234375, 0.00261688232421875, 0.009176254272460938, 0.015735626220703125, 0.022294998168945312, 0.0288543701171875, 0.03541374206542969, 0.041973114013671875, 0.04853248596191406, 0.05509185791015625, 0.06165122985839844, 0.06821060180664062, 0.07476997375488281, 0.081329345703125, 0.08788871765136719, 0.09444808959960938, 0.10100746154785156, 0.10756683349609375, 0.11412620544433594, 0.12068557739257812, 0.1272449493408203, 0.1338043212890625, 0.1403636932373047, 0.14692306518554688, 0.15348243713378906, 0.16004180908203125, 0.16660118103027344, 0.17316055297851562, 0.1797199249267578, 0.186279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 8.0, 4.0, 7.0, 8.0, 10.0, 16.0, 18.0, 12.0, 22.0, 34.0, 34.0, 49.0, 47.0, 80.0, 82.0, 104.0, 90.0, 66.0, 64.0, 48.0, 25.0, 31.0, 19.0, 18.0, 18.0, 18.0, 9.0, 12.0, 11.0, 5.0, 6.0, 4.0, 4.0, 8.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.147954940795898e-05, -7.880479097366333e-05, -7.613003253936768e-05, -7.345527410507202e-05, -7.078051567077637e-05, -6.810575723648071e-05, -6.543099880218506e-05, -6.27562403678894e-05, -6.008148193359375e-05, -5.7406723499298096e-05, -5.473196506500244e-05, -5.205720663070679e-05, -4.938244819641113e-05, -4.670768976211548e-05, -4.4032931327819824e-05, -4.135817289352417e-05, -3.8683414459228516e-05, -3.600865602493286e-05, -3.333389759063721e-05, -3.065913915634155e-05, -2.79843807220459e-05, -2.5309622287750244e-05, -2.263486385345459e-05, -1.9960105419158936e-05, -1.728534698486328e-05, -1.4610588550567627e-05, -1.1935830116271973e-05, -9.261071681976318e-06, -6.586313247680664e-06, -3.91155481338501e-06, -1.2367963790893555e-06, 1.4379620552062988e-06, 4.112720489501953e-06, 6.787478923797607e-06, 9.462237358093262e-06, 1.2136995792388916e-05, 1.481175422668457e-05, 1.7486512660980225e-05, 2.016127109527588e-05, 2.2836029529571533e-05, 2.5510787963867188e-05, 2.8185546398162842e-05, 3.0860304832458496e-05, 3.353506326675415e-05, 3.6209821701049805e-05, 3.888458013534546e-05, 4.155933856964111e-05, 4.423409700393677e-05, 4.690885543823242e-05, 4.9583613872528076e-05, 5.225837230682373e-05, 5.4933130741119385e-05, 5.760788917541504e-05, 6.028264760971069e-05, 6.295740604400635e-05, 6.5632164478302e-05, 6.830692291259766e-05, 7.098168134689331e-05, 7.365643978118896e-05, 7.633119821548462e-05, 7.900595664978027e-05, 8.168071508407593e-05, 8.435547351837158e-05, 8.703023195266724e-05, 8.970499038696289e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 23.0, 25.0, 32.0, 65.0, 85.0, 215.0, 442.0, 908.0, 2322.0, 7648.0, 55244.0, 857245.0, 108618.0, 10587.0, 2938.0, 1114.0, 474.0, 235.0, 126.0, 78.0, 38.0, 22.0, 14.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.442138671875, -0.42858123779296875, -0.4150238037109375, -0.40146636962890625, -0.387908935546875, -0.37435150146484375, -0.3607940673828125, -0.34723663330078125, -0.33367919921875, -0.32012176513671875, -0.3065643310546875, -0.29300689697265625, -0.279449462890625, -0.26589202880859375, -0.2523345947265625, -0.23877716064453125, -0.2252197265625, -0.21166229248046875, -0.1981048583984375, -0.18454742431640625, -0.170989990234375, -0.15743255615234375, -0.1438751220703125, -0.13031768798828125, -0.11676025390625, -0.10320281982421875, -0.0896453857421875, -0.07608795166015625, -0.062530517578125, -0.04897308349609375, -0.0354156494140625, -0.02185821533203125, -0.00830078125, 0.00525665283203125, 0.0188140869140625, 0.03237152099609375, 0.045928955078125, 0.05948638916015625, 0.0730438232421875, 0.08660125732421875, 0.10015869140625, 0.11371612548828125, 0.1272735595703125, 0.14083099365234375, 0.154388427734375, 0.16794586181640625, 0.1815032958984375, 0.19506072998046875, 0.2086181640625, 0.22217559814453125, 0.2357330322265625, 0.24929046630859375, 0.262847900390625, 0.27640533447265625, 0.2899627685546875, 0.30352020263671875, 0.31707763671875, 0.33063507080078125, 0.3441925048828125, 0.35774993896484375, 0.371307373046875, 0.38486480712890625, 0.3984222412109375, 0.41197967529296875, 0.425537109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 12.0, 7.0, 13.0, 19.0, 21.0, 39.0, 42.0, 47.0, 39.0, 46.0, 94.0, 86.0, 111.0, 96.0, 66.0, 57.0, 36.0, 36.0, 23.0, 20.0, 16.0, 9.0, 11.0, 7.0, 12.0, 8.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29345703125, -0.28507232666015625, -0.2766876220703125, -0.26830291748046875, -0.259918212890625, -0.25153350830078125, -0.2431488037109375, -0.23476409912109375, -0.22637939453125, -0.21799468994140625, -0.2096099853515625, -0.20122528076171875, -0.192840576171875, -0.18445587158203125, -0.1760711669921875, -0.16768646240234375, -0.1593017578125, -0.15091705322265625, -0.1425323486328125, -0.13414764404296875, -0.125762939453125, -0.11737823486328125, -0.1089935302734375, -0.10060882568359375, -0.09222412109375, -0.08383941650390625, -0.0754547119140625, -0.06707000732421875, -0.058685302734375, -0.05030059814453125, -0.0419158935546875, -0.03353118896484375, -0.025146484375, -0.01676177978515625, -0.0083770751953125, 7.62939453125e-06, 0.008392333984375, 0.01677703857421875, 0.0251617431640625, 0.03354644775390625, 0.04193115234375, 0.05031585693359375, 0.0587005615234375, 0.06708526611328125, 0.075469970703125, 0.08385467529296875, 0.0922393798828125, 0.10062408447265625, 0.1090087890625, 0.11739349365234375, 0.1257781982421875, 0.13416290283203125, 0.142547607421875, 0.15093231201171875, 0.1593170166015625, 0.16770172119140625, 0.17608642578125, 0.18447113037109375, 0.1928558349609375, 0.20124053955078125, 0.209625244140625, 0.21800994873046875, 0.2263946533203125, 0.23477935791015625, 0.2431640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 4.0, 11.0, 25.0, 128.0, 297.0, 340.0, 135.0, 27.0, 18.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.926177978515625, -12.611329078674316, -12.296481132507324, -11.981632232666016, -11.666784286499023, -11.351935386657715, -11.037087440490723, -10.722238540649414, -10.407390594482422, -10.092541694641113, -9.777693748474121, -9.462844848632812, -9.14799690246582, -8.833148002624512, -8.51830005645752, -8.203451156616211, -7.888602256774902, -7.573753833770752, -7.258905410766602, -6.944056987762451, -6.629208564758301, -6.314359664916992, -5.999511241912842, -5.684662818908691, -5.369814395904541, -5.054965972900391, -4.74011754989624, -4.42526912689209, -4.110420227050781, -3.79557204246521, -3.4807233810424805, -3.16587495803833, -2.851027488708496, -2.5361790657043457, -2.2213306427001953, -1.9064819812774658, -1.5916335582733154, -1.276785135269165, -0.9619365930557251, -0.6470880508422852, -0.33223962783813477, -0.0173911452293396, 0.29745733737945557, 0.6123058199882507, 0.9271543025970459, 1.2420027256011963, 1.5568512678146362, 1.8716998100280762, 2.1865482330322266, 2.501396656036377, 2.8162450790405273, 3.131093740463257, 3.4459421634674072, 3.7607905864715576, 4.075639247894287, 4.3904876708984375, 4.705336093902588, 5.020184516906738, 5.335032939910889, 5.649881362915039, 5.964730262756348, 6.27957820892334, 6.594427108764648, 6.909275531768799, 7.224123954772949]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 2.0, 7.0, 11.0, 15.0, 16.0, 13.0, 20.0, 18.0, 34.0, 22.0, 33.0, 46.0, 31.0, 51.0, 55.0, 57.0, 71.0, 67.0, 58.0, 41.0, 46.0, 26.0, 30.0, 33.0, 30.0, 30.0, 20.0, 17.0, 17.0, 10.0, 12.0, 11.0, 9.0, 4.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.563842296600342, -2.479626417160034, -2.3954105377197266, -2.31119441986084, -2.2269785404205322, -2.1427626609802246, -2.058546781539917, -1.9743309020996094, -1.8901149034500122, -1.8058990240097046, -1.7216830253601074, -1.6374671459197998, -1.5532512664794922, -1.469035267829895, -1.3848193883895874, -1.3006033897399902, -1.2163875102996826, -1.132171630859375, -1.0479556322097778, -0.9637397527694702, -0.8795238137245178, -0.7953078746795654, -0.7110919952392578, -0.6268760561943054, -0.542660117149353, -0.45844417810440063, -0.37422826886177063, -0.2900123596191406, -0.20579642057418823, -0.12158048152923584, -0.03736460208892822, 0.04685133695602417, 0.13106727600097656, 0.21528320014476776, 0.29949912428855896, 0.38371503353118896, 0.46793097257614136, 0.5521469116210938, 0.6363627910614014, 0.7205787301063538, 0.8047946691513062, 0.8890106081962585, 0.9732265472412109, 1.0574424266815186, 1.1416583061218262, 1.2258743047714233, 1.310090184211731, 1.3943061828613281, 1.4785220623016357, 1.5627379417419434, 1.6469539403915405, 1.7311698198318481, 1.8153858184814453, 1.899601697921753, 1.9838175773620605, 2.068033456802368, 2.152249336242676, 2.2364652156829834, 2.320681095123291, 2.4048972129821777, 2.4891130924224854, 2.573328971862793, 2.6575448513031006, 2.741760730743408, 2.825976848602295]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 10.0, 18.0, 10.0, 23.0, 38.0, 78.0, 136.0, 299.0, 618.0, 1521.0, 4102.0, 12535.0, 46551.0, 244330.0, 2054875.0, 1587099.0, 186698.0, 38449.0, 10621.0, 3637.0, 1316.0, 653.0, 270.0, 161.0, 66.0, 43.0, 36.0, 16.0, 12.0, 12.0, 8.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.23528099060058594, -0.22654342651367188, -0.2178058624267578, -0.20906829833984375, -0.2003307342529297, -0.19159317016601562, -0.18285560607910156, -0.1741180419921875, -0.16538047790527344, -0.15664291381835938, -0.1479053497314453, -0.13916778564453125, -0.1304302215576172, -0.12169265747070312, -0.11295509338378906, -0.104217529296875, -0.09547996520996094, -0.08674240112304688, -0.07800483703613281, -0.06926727294921875, -0.06052970886230469, -0.051792144775390625, -0.04305458068847656, -0.0343170166015625, -0.025579452514648438, -0.016841888427734375, -0.008104324340820312, 0.00063323974609375, 0.009370803833007812, 0.018108367919921875, 0.026845932006835938, 0.03558349609375, 0.04432106018066406, 0.053058624267578125, 0.06179618835449219, 0.07053375244140625, 0.07927131652832031, 0.08800888061523438, 0.09674644470214844, 0.1054840087890625, 0.11422157287597656, 0.12295913696289062, 0.1316967010498047, 0.14043426513671875, 0.1491718292236328, 0.15790939331054688, 0.16664695739746094, 0.175384521484375, 0.18412208557128906, 0.19285964965820312, 0.2015972137451172, 0.21033477783203125, 0.2190723419189453, 0.22780990600585938, 0.23654747009277344, 0.2452850341796875, 0.25402259826660156, 0.2627601623535156, 0.2714977264404297, 0.28023529052734375, 0.2889728546142578, 0.2977104187011719, 0.30644798278808594, 0.315185546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 4.0, 11.0, 4.0, 8.0, 9.0, 22.0, 17.0, 25.0, 24.0, 20.0, 30.0, 26.0, 35.0, 38.0, 37.0, 51.0, 42.0, 41.0, 50.0, 45.0, 34.0, 48.0, 32.0, 46.0, 54.0, 36.0, 33.0, 23.0, 23.0, 21.0, 17.0, 17.0, 12.0, 13.0, 6.0, 10.0, 6.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.15283203125, -0.14876365661621094, -0.14469528198242188, -0.1406269073486328, -0.13655853271484375, -0.1324901580810547, -0.12842178344726562, -0.12435340881347656, -0.1202850341796875, -0.11621665954589844, -0.11214828491210938, -0.10807991027832031, -0.10401153564453125, -0.09994316101074219, -0.09587478637695312, -0.09180641174316406, -0.087738037109375, -0.08366966247558594, -0.07960128784179688, -0.07553291320800781, -0.07146453857421875, -0.06739616394042969, -0.06332778930664062, -0.05925941467285156, -0.0551910400390625, -0.05112266540527344, -0.047054290771484375, -0.04298591613769531, -0.03891754150390625, -0.03484916687011719, -0.030780792236328125, -0.026712417602539062, -0.02264404296875, -0.018575668334960938, -0.014507293701171875, -0.010438919067382812, -0.00637054443359375, -0.0023021697998046875, 0.001766204833984375, 0.0058345794677734375, 0.0099029541015625, 0.013971328735351562, 0.018039703369140625, 0.022108078002929688, 0.02617645263671875, 0.030244827270507812, 0.034313201904296875, 0.03838157653808594, 0.042449951171875, 0.04651832580566406, 0.050586700439453125, 0.05465507507324219, 0.05872344970703125, 0.06279182434082031, 0.06686019897460938, 0.07092857360839844, 0.0749969482421875, 0.07906532287597656, 0.08313369750976562, 0.08720207214355469, 0.09127044677734375, 0.09533882141113281, 0.09940719604492188, 0.10347557067871094, 0.1075439453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 11.0, 15.0, 17.0, 19.0, 39.0, 65.0, 108.0, 188.0, 337.0, 723.0, 1851.0, 5382.0, 18309.0, 75503.0, 454144.0, 2751928.0, 739996.0, 108779.0, 24889.0, 7302.0, 2512.0, 1026.0, 473.0, 280.0, 148.0, 84.0, 40.0, 35.0, 22.0, 11.0, 15.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3915901184082031, -0.38059234619140625, -0.3695945739746094, -0.3585968017578125, -0.3475990295410156, -0.33660125732421875, -0.3256034851074219, -0.314605712890625, -0.3036079406738281, -0.29261016845703125, -0.2816123962402344, -0.2706146240234375, -0.2596168518066406, -0.24861907958984375, -0.23762130737304688, -0.22662353515625, -0.21562576293945312, -0.20462799072265625, -0.19363021850585938, -0.1826324462890625, -0.17163467407226562, -0.16063690185546875, -0.14963912963867188, -0.138641357421875, -0.12764358520507812, -0.11664581298828125, -0.10564804077148438, -0.0946502685546875, -0.08365249633789062, -0.07265472412109375, -0.061656951904296875, -0.0506591796875, -0.039661407470703125, -0.02866363525390625, -0.017665863037109375, -0.0066680908203125, 0.004329681396484375, 0.01532745361328125, 0.026325225830078125, 0.037322998046875, 0.048320770263671875, 0.05931854248046875, 0.07031631469726562, 0.0813140869140625, 0.09231185913085938, 0.10330963134765625, 0.11430740356445312, 0.12530517578125, 0.13630294799804688, 0.14730072021484375, 0.15829849243164062, 0.1692962646484375, 0.18029403686523438, 0.19129180908203125, 0.20228958129882812, 0.213287353515625, 0.22428512573242188, 0.23528289794921875, 0.24628067016601562, 0.2572784423828125, 0.2682762145996094, 0.27927398681640625, 0.2902717590332031, 0.30126953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 5.0, 3.0, 7.0, 10.0, 16.0, 13.0, 16.0, 32.0, 28.0, 48.0, 39.0, 75.0, 103.0, 128.0, 176.0, 275.0, 339.0, 403.0, 478.0, 420.0, 377.0, 266.0, 199.0, 143.0, 112.0, 93.0, 48.0, 43.0, 52.0, 23.0, 21.0, 19.0, 12.0, 17.0, 7.0, 11.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2672309875488281, -0.25638580322265625, -0.24554061889648438, -0.2346954345703125, -0.22385025024414062, -0.21300506591796875, -0.20215988159179688, -0.191314697265625, -0.18046951293945312, -0.16962432861328125, -0.15877914428710938, -0.1479339599609375, -0.13708877563476562, -0.12624359130859375, -0.11539840698242188, -0.10455322265625, -0.09370803833007812, -0.08286285400390625, -0.07201766967773438, -0.0611724853515625, -0.050327301025390625, -0.03948211669921875, -0.028636932373046875, -0.017791748046875, -0.006946563720703125, 0.00389862060546875, 0.014743804931640625, 0.0255889892578125, 0.036434173583984375, 0.04727935791015625, 0.058124542236328125, 0.0689697265625, 0.07981491088867188, 0.09066009521484375, 0.10150527954101562, 0.1123504638671875, 0.12319564819335938, 0.13404083251953125, 0.14488601684570312, 0.155731201171875, 0.16657638549804688, 0.17742156982421875, 0.18826675415039062, 0.1991119384765625, 0.20995712280273438, 0.22080230712890625, 0.23164749145507812, 0.24249267578125, 0.2533378601074219, 0.26418304443359375, 0.2750282287597656, 0.2858734130859375, 0.2967185974121094, 0.30756378173828125, 0.3184089660644531, 0.329254150390625, 0.3400993347167969, 0.35094451904296875, 0.3617897033691406, 0.3726348876953125, 0.3834800720214844, 0.39432525634765625, 0.4051704406738281, 0.416015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 15.0, 26.0, 47.0, 93.0, 137.0, 201.0, 167.0, 117.0, 81.0, 38.0, 25.0, 9.0, 6.0, 4.0, 7.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.917229652404785, -3.7754342555999756, -3.633638858795166, -3.4918434619903564, -3.350048065185547, -3.208252429962158, -3.0664570331573486, -2.924661636352539, -2.7828662395477295, -2.64107084274292, -2.4992754459381104, -2.357480049133301, -2.215684413909912, -2.0738892555236816, -1.932093620300293, -1.7902982234954834, -1.6485028266906738, -1.5067074298858643, -1.3649120330810547, -1.2231165170669556, -1.081321120262146, -0.9395257234573364, -0.7977302670478821, -0.6559348106384277, -0.5141394138336182, -0.3723439872264862, -0.23054856061935425, -0.08875313401222229, 0.05304229259490967, 0.19483768939971924, 0.3366331458091736, 0.47842860221862793, 0.6202239990234375, 0.7620193958282471, 0.9038148522377014, 1.0456103086471558, 1.1874057054519653, 1.329201102256775, 1.470996618270874, 1.6127920150756836, 1.7545874118804932, 1.8963828086853027, 2.0381782054901123, 2.179973602294922, 2.3217692375183105, 2.463564395904541, 2.6053600311279297, 2.7471554279327393, 2.888950824737549, 3.0307462215423584, 3.172541618347168, 3.3143370151519775, 3.456132411956787, 3.597928047180176, 3.7397234439849854, 3.881518840789795, 4.023314476013184, 4.165110111236572, 4.306905269622803, 4.448700904846191, 4.590496063232422, 4.7322916984558105, 4.874086856842041, 5.01588249206543, 5.15767765045166]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 12.0, 15.0, 17.0, 16.0, 20.0, 20.0, 24.0, 29.0, 32.0, 27.0, 27.0, 34.0, 47.0, 36.0, 34.0, 37.0, 47.0, 32.0, 37.0, 55.0, 38.0, 34.0, 38.0, 30.0, 35.0, 31.0, 15.0, 23.0, 27.0, 19.0, 16.0, 9.0, 12.0, 6.0, 7.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.8330843448638916, -1.777659296989441, -1.7222343683242798, -1.666809320449829, -1.6113842725753784, -1.5559592247009277, -1.5005342960357666, -1.445109248161316, -1.3896842002868652, -1.3342591524124146, -1.2788342237472534, -1.2234091758728027, -1.167984127998352, -1.1125590801239014, -1.0571341514587402, -1.0017091035842896, -0.9462841749191284, -0.8908591866493225, -0.8354341387748718, -0.7800091505050659, -0.7245841026306152, -0.6691591143608093, -0.6137341260910034, -0.5583090782165527, -0.5028840899467468, -0.44745907187461853, -0.39203405380249023, -0.3366090655326843, -0.28118404746055603, -0.22575902938842773, -0.17033404111862183, -0.11490902304649353, -0.059484124183654785, -0.004059113562107086, 0.05136589705944061, 0.10679090023040771, 0.162215918302536, 0.2176409363746643, 0.2730659246444702, 0.3284909427165985, 0.3839159607887268, 0.4393409788608551, 0.4947659969329834, 0.5501909852027893, 0.6056159734725952, 0.6610410213470459, 0.7164660096168518, 0.7718909978866577, 0.8273160457611084, 0.8827410340309143, 0.938166081905365, 0.9935910701751709, 1.0490161180496216, 1.1044411659240723, 1.1598660945892334, 1.215291142463684, 1.2707161903381348, 1.3261412382125854, 1.3815661668777466, 1.4369912147521973, 1.492416262626648, 1.5478413105010986, 1.6032662391662598, 1.6586912870407104, 1.7141162157058716]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 18.0, 17.0, 31.0, 59.0, 100.0, 188.0, 306.0, 547.0, 1129.0, 2350.0, 4961.0, 11994.0, 33036.0, 122831.0, 536307.0, 249478.0, 54054.0, 17644.0, 6962.0, 3226.0, 1569.0, 780.0, 418.0, 236.0, 113.0, 78.0, 48.0, 19.0, 12.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.41536712646484375, -0.4022674560546875, -0.38916778564453125, -0.376068115234375, -0.36296844482421875, -0.3498687744140625, -0.33676910400390625, -0.32366943359375, -0.31056976318359375, -0.2974700927734375, -0.28437042236328125, -0.271270751953125, -0.25817108154296875, -0.2450714111328125, -0.23197174072265625, -0.2188720703125, -0.20577239990234375, -0.1926727294921875, -0.17957305908203125, -0.166473388671875, -0.15337371826171875, -0.1402740478515625, -0.12717437744140625, -0.11407470703125, -0.10097503662109375, -0.0878753662109375, -0.07477569580078125, -0.061676025390625, -0.04857635498046875, -0.0354766845703125, -0.02237701416015625, -0.00927734375, 0.00382232666015625, 0.0169219970703125, 0.03002166748046875, 0.043121337890625, 0.05622100830078125, 0.0693206787109375, 0.08242034912109375, 0.09552001953125, 0.10861968994140625, 0.1217193603515625, 0.13481903076171875, 0.147918701171875, 0.16101837158203125, 0.1741180419921875, 0.18721771240234375, 0.2003173828125, 0.21341705322265625, 0.2265167236328125, 0.23961639404296875, 0.252716064453125, 0.26581573486328125, 0.2789154052734375, 0.29201507568359375, 0.30511474609375, 0.31821441650390625, 0.3313140869140625, 0.34441375732421875, 0.357513427734375, 0.37061309814453125, 0.3837127685546875, 0.39681243896484375, 0.409912109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 13.0, 7.0, 20.0, 13.0, 19.0, 36.0, 33.0, 25.0, 42.0, 35.0, 47.0, 52.0, 52.0, 58.0, 60.0, 53.0, 66.0, 55.0, 64.0, 38.0, 39.0, 40.0, 23.0, 24.0, 21.0, 12.0, 13.0, 10.0, 5.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16463470458984375, -0.1589813232421875, -0.15332794189453125, -0.147674560546875, -0.14202117919921875, -0.1363677978515625, -0.13071441650390625, -0.12506103515625, -0.11940765380859375, -0.1137542724609375, -0.10810089111328125, -0.102447509765625, -0.09679412841796875, -0.0911407470703125, -0.08548736572265625, -0.079833984375, -0.07418060302734375, -0.0685272216796875, -0.06287384033203125, -0.057220458984375, -0.05156707763671875, -0.0459136962890625, -0.04026031494140625, -0.03460693359375, -0.02895355224609375, -0.0233001708984375, -0.01764678955078125, -0.011993408203125, -0.00634002685546875, -0.0006866455078125, 0.00496673583984375, 0.0106201171875, 0.01627349853515625, 0.0219268798828125, 0.02758026123046875, 0.033233642578125, 0.03888702392578125, 0.0445404052734375, 0.05019378662109375, 0.05584716796875, 0.06150054931640625, 0.0671539306640625, 0.07280731201171875, 0.078460693359375, 0.08411407470703125, 0.0897674560546875, 0.09542083740234375, 0.10107421875, 0.10672760009765625, 0.1123809814453125, 0.11803436279296875, 0.123687744140625, 0.12934112548828125, 0.1349945068359375, 0.14064788818359375, 0.14630126953125, 0.15195465087890625, 0.1576080322265625, 0.16326141357421875, 0.168914794921875, 0.17456817626953125, 0.1802215576171875, 0.18587493896484375, 0.1915283203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 15.0, 14.0, 19.0, 39.0, 71.0, 91.0, 141.0, 197.0, 314.0, 526.0, 1007.0, 2019.0, 5521.0, 22956.0, 216526.0, 737264.0, 46718.0, 9119.0, 2855.0, 1307.0, 661.0, 390.0, 246.0, 155.0, 126.0, 69.0, 43.0, 29.0, 23.0, 26.0, 11.0, 7.0, 11.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.806640625, -0.783721923828125, -0.76080322265625, -0.737884521484375, -0.7149658203125, -0.692047119140625, -0.66912841796875, -0.646209716796875, -0.623291015625, -0.600372314453125, -0.57745361328125, -0.554534912109375, -0.5316162109375, -0.508697509765625, -0.48577880859375, -0.462860107421875, -0.43994140625, -0.417022705078125, -0.39410400390625, -0.371185302734375, -0.3482666015625, -0.325347900390625, -0.30242919921875, -0.279510498046875, -0.256591796875, -0.233673095703125, -0.21075439453125, -0.187835693359375, -0.1649169921875, -0.141998291015625, -0.11907958984375, -0.096160888671875, -0.0732421875, -0.050323486328125, -0.02740478515625, -0.004486083984375, 0.0184326171875, 0.041351318359375, 0.06427001953125, 0.087188720703125, 0.110107421875, 0.133026123046875, 0.15594482421875, 0.178863525390625, 0.2017822265625, 0.224700927734375, 0.24761962890625, 0.270538330078125, 0.29345703125, 0.316375732421875, 0.33929443359375, 0.362213134765625, 0.3851318359375, 0.408050537109375, 0.43096923828125, 0.453887939453125, 0.476806640625, 0.499725341796875, 0.52264404296875, 0.545562744140625, 0.5684814453125, 0.591400146484375, 0.61431884765625, 0.637237548828125, 0.66015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 10.0, 4.0, 8.0, 5.0, 4.0, 8.0, 10.0, 9.0, 17.0, 12.0, 16.0, 19.0, 22.0, 29.0, 33.0, 23.0, 34.0, 27.0, 38.0, 53.0, 45.0, 50.0, 44.0, 38.0, 45.0, 46.0, 41.0, 46.0, 31.0, 30.0, 27.0, 29.0, 26.0, 13.0, 13.0, 14.0, 10.0, 10.0, 7.0, 15.0, 7.0, 8.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5335311889648438, -0.5157928466796875, -0.49805450439453125, -0.480316162109375, -0.46257781982421875, -0.4448394775390625, -0.42710113525390625, -0.40936279296875, -0.39162445068359375, -0.3738861083984375, -0.35614776611328125, -0.338409423828125, -0.32067108154296875, -0.3029327392578125, -0.28519439697265625, -0.2674560546875, -0.24971771240234375, -0.2319793701171875, -0.21424102783203125, -0.196502685546875, -0.17876434326171875, -0.1610260009765625, -0.14328765869140625, -0.12554931640625, -0.10781097412109375, -0.0900726318359375, -0.07233428955078125, -0.054595947265625, -0.03685760498046875, -0.0191192626953125, -0.00138092041015625, 0.016357421875, 0.03409576416015625, 0.0518341064453125, 0.06957244873046875, 0.087310791015625, 0.10504913330078125, 0.1227874755859375, 0.14052581787109375, 0.15826416015625, 0.17600250244140625, 0.1937408447265625, 0.21147918701171875, 0.229217529296875, 0.24695587158203125, 0.2646942138671875, 0.28243255615234375, 0.3001708984375, 0.31790924072265625, 0.3356475830078125, 0.35338592529296875, 0.371124267578125, 0.38886260986328125, 0.4066009521484375, 0.42433929443359375, 0.44207763671875, 0.45981597900390625, 0.4775543212890625, 0.49529266357421875, 0.513031005859375, 0.5307693481445312, 0.5485076904296875, 0.5662460327148438, 0.583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 10.0, 17.0, 15.0, 21.0, 31.0, 31.0, 56.0, 100.0, 158.0, 263.0, 528.0, 1052.0, 2652.0, 7726.0, 28807.0, 154564.0, 704144.0, 114105.0, 23384.0, 6454.0, 2268.0, 950.0, 475.0, 258.0, 140.0, 103.0, 58.0, 44.0, 32.0, 25.0, 21.0, 9.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.264404296875, -0.2571449279785156, -0.24988555908203125, -0.24262619018554688, -0.2353668212890625, -0.22810745239257812, -0.22084808349609375, -0.21358871459960938, -0.206329345703125, -0.19906997680664062, -0.19181060791015625, -0.18455123901367188, -0.1772918701171875, -0.17003250122070312, -0.16277313232421875, -0.15551376342773438, -0.14825439453125, -0.14099502563476562, -0.13373565673828125, -0.12647628784179688, -0.1192169189453125, -0.11195755004882812, -0.10469818115234375, -0.09743881225585938, -0.090179443359375, -0.08292007446289062, -0.07566070556640625, -0.06840133666992188, -0.0611419677734375, -0.053882598876953125, -0.04662322998046875, -0.039363861083984375, -0.0321044921875, -0.024845123291015625, -0.01758575439453125, -0.010326385498046875, -0.0030670166015625, 0.004192352294921875, 0.01145172119140625, 0.018711090087890625, 0.025970458984375, 0.033229827880859375, 0.04048919677734375, 0.047748565673828125, 0.0550079345703125, 0.062267303466796875, 0.06952667236328125, 0.07678604125976562, 0.08404541015625, 0.09130477905273438, 0.09856414794921875, 0.10582351684570312, 0.1130828857421875, 0.12034225463867188, 0.12760162353515625, 0.13486099243164062, 0.142120361328125, 0.14937973022460938, 0.15663909912109375, 0.16389846801757812, 0.1711578369140625, 0.17841720581054688, 0.18567657470703125, 0.19293594360351562, 0.2001953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 0.0, 8.0, 4.0, 21.0, 19.0, 20.0, 30.0, 25.0, 50.0, 60.0, 83.0, 111.0, 100.0, 91.0, 82.0, 62.0, 41.0, 34.0, 37.0, 22.0, 18.0, 15.0, 6.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.147954940795898e-05, -7.905811071395874e-05, -7.66366720199585e-05, -7.421523332595825e-05, -7.179379463195801e-05, -6.937235593795776e-05, -6.695091724395752e-05, -6.452947854995728e-05, -6.210803985595703e-05, -5.968660116195679e-05, -5.726516246795654e-05, -5.48437237739563e-05, -5.2422285079956055e-05, -5.000084638595581e-05, -4.7579407691955566e-05, -4.515796899795532e-05, -4.273653030395508e-05, -4.0315091609954834e-05, -3.789365291595459e-05, -3.5472214221954346e-05, -3.30507755279541e-05, -3.062933683395386e-05, -2.8207898139953613e-05, -2.578645944595337e-05, -2.3365020751953125e-05, -2.094358205795288e-05, -1.8522143363952637e-05, -1.6100704669952393e-05, -1.3679265975952148e-05, -1.1257827281951904e-05, -8.83638858795166e-06, -6.414949893951416e-06, -3.993511199951172e-06, -1.5720725059509277e-06, 8.493661880493164e-07, 3.2708048820495605e-06, 5.692243576049805e-06, 8.113682270050049e-06, 1.0535120964050293e-05, 1.2956559658050537e-05, 1.537799835205078e-05, 1.7799437046051025e-05, 2.022087574005127e-05, 2.2642314434051514e-05, 2.5063753128051758e-05, 2.7485191822052002e-05, 2.9906630516052246e-05, 3.232806921005249e-05, 3.4749507904052734e-05, 3.717094659805298e-05, 3.959238529205322e-05, 4.201382398605347e-05, 4.443526268005371e-05, 4.6856701374053955e-05, 4.92781400680542e-05, 5.169957876205444e-05, 5.412101745605469e-05, 5.654245615005493e-05, 5.8963894844055176e-05, 6.138533353805542e-05, 6.380677223205566e-05, 6.622821092605591e-05, 6.864964962005615e-05, 7.10710883140564e-05, 7.349252700805664e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 13.0, 16.0, 20.0, 24.0, 49.0, 48.0, 91.0, 119.0, 195.0, 277.0, 483.0, 827.0, 1516.0, 3131.0, 7155.0, 21365.0, 89115.0, 639993.0, 221478.0, 41106.0, 11924.0, 4589.0, 2075.0, 1073.0, 712.0, 373.0, 242.0, 173.0, 120.0, 61.0, 48.0, 27.0, 32.0, 12.0, 16.0, 7.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2056884765625, -0.19940757751464844, -0.19312667846679688, -0.1868457794189453, -0.18056488037109375, -0.1742839813232422, -0.16800308227539062, -0.16172218322753906, -0.1554412841796875, -0.14916038513183594, -0.14287948608398438, -0.1365985870361328, -0.13031768798828125, -0.12403678894042969, -0.11775588989257812, -0.11147499084472656, -0.105194091796875, -0.09891319274902344, -0.09263229370117188, -0.08635139465332031, -0.08007049560546875, -0.07378959655761719, -0.06750869750976562, -0.06122779846191406, -0.0549468994140625, -0.04866600036621094, -0.042385101318359375, -0.03610420227050781, -0.02982330322265625, -0.023542404174804688, -0.017261505126953125, -0.010980606079101562, -0.00469970703125, 0.0015811920166015625, 0.007862091064453125, 0.014142990112304688, 0.02042388916015625, 0.026704788208007812, 0.032985687255859375, 0.03926658630371094, 0.0455474853515625, 0.05182838439941406, 0.058109283447265625, 0.06439018249511719, 0.07067108154296875, 0.07695198059082031, 0.08323287963867188, 0.08951377868652344, 0.095794677734375, 0.10207557678222656, 0.10835647583007812, 0.11463737487792969, 0.12091827392578125, 0.1271991729736328, 0.13348007202148438, 0.13976097106933594, 0.1460418701171875, 0.15232276916503906, 0.15860366821289062, 0.1648845672607422, 0.17116546630859375, 0.1774463653564453, 0.18372726440429688, 0.19000816345214844, 0.1962890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 8.0, 4.0, 9.0, 16.0, 13.0, 15.0, 26.0, 35.0, 38.0, 47.0, 76.0, 87.0, 114.0, 118.0, 97.0, 57.0, 51.0, 38.0, 22.0, 24.0, 24.0, 18.0, 15.0, 10.0, 9.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.18309783935546875, -0.1767425537109375, -0.17038726806640625, -0.164031982421875, -0.15767669677734375, -0.1513214111328125, -0.14496612548828125, -0.13861083984375, -0.13225555419921875, -0.1259002685546875, -0.11954498291015625, -0.113189697265625, -0.10683441162109375, -0.1004791259765625, -0.09412384033203125, -0.0877685546875, -0.08141326904296875, -0.0750579833984375, -0.06870269775390625, -0.062347412109375, -0.05599212646484375, -0.0496368408203125, -0.04328155517578125, -0.03692626953125, -0.03057098388671875, -0.0242156982421875, -0.01786041259765625, -0.011505126953125, -0.00514984130859375, 0.0012054443359375, 0.00756072998046875, 0.013916015625, 0.02027130126953125, 0.0266265869140625, 0.03298187255859375, 0.039337158203125, 0.04569244384765625, 0.0520477294921875, 0.05840301513671875, 0.06475830078125, 0.07111358642578125, 0.0774688720703125, 0.08382415771484375, 0.090179443359375, 0.09653472900390625, 0.1028900146484375, 0.10924530029296875, 0.1156005859375, 0.12195587158203125, 0.1283111572265625, 0.13466644287109375, 0.141021728515625, 0.14737701416015625, 0.1537322998046875, 0.16008758544921875, 0.16644287109375, 0.17279815673828125, 0.1791534423828125, 0.18550872802734375, 0.191864013671875, 0.19821929931640625, 0.2045745849609375, 0.21092987060546875, 0.21728515625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 5.0, 8.0, 15.0, 46.0, 157.0, 328.0, 268.0, 101.0, 35.0, 7.0, 5.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.837558746337891, -6.629733562469482, -6.421907901763916, -6.214082717895508, -6.006257057189941, -5.798431873321533, -5.590606689453125, -5.382781028747559, -5.17495584487915, -4.967130661010742, -4.759305000305176, -4.551479816436768, -4.343654155731201, -4.135828971862793, -3.9280035495758057, -3.7201781272888184, -3.512352705001831, -3.3045272827148438, -3.0967018604278564, -2.888876438140869, -2.681051254272461, -2.4732258319854736, -2.2654004096984863, -2.057575225830078, -1.8497496843338013, -1.641924262046814, -1.4340989589691162, -1.226273536682129, -1.0184481143951416, -0.8106228113174438, -0.6027973890304565, -0.3949720859527588, -0.18714666366577148, 0.02067871391773224, 0.22850409150123596, 0.4363294839859009, 0.6441548466682434, 0.8519802093505859, 1.0598056316375732, 1.267630934715271, 1.4754563570022583, 1.6832817792892456, 1.8911070823669434, 2.0989325046539307, 2.306757926940918, 2.514583110809326, 2.7224087715148926, 2.930233955383301, 3.138059377670288, 3.3458847999572754, 3.5537102222442627, 3.76153564453125, 3.969360828399658, 4.177186012268066, 4.385011672973633, 4.592836856842041, 4.800662517547607, 5.008487701416016, 5.216313362121582, 5.42413854598999, 5.631964206695557, 5.839789390563965, 6.047615051269531, 6.2554402351379395, 6.463265419006348]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 11.0, 8.0, 7.0, 12.0, 12.0, 16.0, 15.0, 17.0, 29.0, 29.0, 36.0, 32.0, 28.0, 44.0, 40.0, 71.0, 67.0, 66.0, 58.0, 67.0, 38.0, 41.0, 38.0, 29.0, 27.0, 21.0, 24.0, 21.0, 20.0, 18.0, 4.0, 16.0, 7.0, 9.0, 4.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.346055030822754, -2.266205310821533, -2.1863555908203125, -2.106505870819092, -2.026656150817871, -1.9468064308166504, -1.8669567108154297, -1.787106990814209, -1.7072572708129883, -1.6274075508117676, -1.5475578308105469, -1.4677081108093262, -1.3878583908081055, -1.3080086708068848, -1.228158950805664, -1.1483092308044434, -1.0684596300125122, -0.9886099100112915, -0.9087601900100708, -0.8289104700088501, -0.7490607500076294, -0.6692110300064087, -0.5893613696098328, -0.5095116496086121, -0.42966192960739136, -0.34981220960617065, -0.26996248960494995, -0.19011279940605164, -0.11026307940483093, -0.03041335940361023, 0.049436330795288086, 0.1292860507965088, 0.2091357707977295, 0.2889854907989502, 0.3688352108001709, 0.4486849009990692, 0.5285346508026123, 0.608384370803833, 0.6882340312004089, 0.7680837512016296, 0.8479334712028503, 0.927783191204071, 1.007632851600647, 1.0874825716018677, 1.1673322916030884, 1.247182011604309, 1.3270317316055298, 1.4068814516067505, 1.4867311716079712, 1.566580891609192, 1.6464306116104126, 1.7262803316116333, 1.806130051612854, 1.8859797716140747, 1.9658293724060059, 2.0456790924072266, 2.1255288124084473, 2.205378532409668, 2.2852282524108887, 2.3650779724121094, 2.44492769241333, 2.524777412414551, 2.6046271324157715, 2.684476852416992, 2.764326572418213]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 15.0, 10.0, 16.0, 25.0, 33.0, 42.0, 62.0, 131.0, 287.0, 611.0, 1641.0, 5344.0, 21855.0, 145670.0, 2388782.0, 1514496.0, 92551.0, 16034.0, 4172.0, 1379.0, 508.0, 246.0, 121.0, 66.0, 50.0, 33.0, 22.0, 16.0, 14.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.376953125, -0.3661537170410156, -0.35535430908203125, -0.3445549011230469, -0.3337554931640625, -0.3229560852050781, -0.31215667724609375, -0.3013572692871094, -0.290557861328125, -0.2797584533691406, -0.26895904541015625, -0.2581596374511719, -0.2473602294921875, -0.23656082153320312, -0.22576141357421875, -0.21496200561523438, -0.20416259765625, -0.19336318969726562, -0.18256378173828125, -0.17176437377929688, -0.1609649658203125, -0.15016555786132812, -0.13936614990234375, -0.12856674194335938, -0.117767333984375, -0.10696792602539062, -0.09616851806640625, -0.08536911010742188, -0.0745697021484375, -0.06377029418945312, -0.05297088623046875, -0.042171478271484375, -0.0313720703125, -0.020572662353515625, -0.00977325439453125, 0.001026153564453125, 0.0118255615234375, 0.022624969482421875, 0.03342437744140625, 0.044223785400390625, 0.055023193359375, 0.06582260131835938, 0.07662200927734375, 0.08742141723632812, 0.0982208251953125, 0.10902023315429688, 0.11981964111328125, 0.13061904907226562, 0.14141845703125, 0.15221786499023438, 0.16301727294921875, 0.17381668090820312, 0.1846160888671875, 0.19541549682617188, 0.20621490478515625, 0.21701431274414062, 0.227813720703125, 0.23861312866210938, 0.24941253662109375, 0.2602119445800781, 0.2710113525390625, 0.2818107604980469, 0.29261016845703125, 0.3034095764160156, 0.314208984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 10.0, 9.0, 8.0, 8.0, 10.0, 16.0, 16.0, 20.0, 30.0, 24.0, 35.0, 35.0, 37.0, 44.0, 36.0, 49.0, 32.0, 48.0, 64.0, 53.0, 43.0, 46.0, 38.0, 28.0, 37.0, 29.0, 32.0, 26.0, 29.0, 18.0, 14.0, 16.0, 10.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.11444091796875, -0.11026477813720703, -0.10608863830566406, -0.1019124984741211, -0.09773635864257812, -0.09356021881103516, -0.08938407897949219, -0.08520793914794922, -0.08103179931640625, -0.07685565948486328, -0.07267951965332031, -0.06850337982177734, -0.06432723999023438, -0.060151100158691406, -0.05597496032714844, -0.05179882049560547, -0.0476226806640625, -0.04344654083251953, -0.03927040100097656, -0.035094261169433594, -0.030918121337890625, -0.026741981506347656, -0.022565841674804688, -0.01838970184326172, -0.01421356201171875, -0.010037422180175781, -0.0058612823486328125, -0.0016851425170898438, 0.002490997314453125, 0.006667137145996094, 0.010843276977539062, 0.015019416809082031, 0.019195556640625, 0.02337169647216797, 0.027547836303710938, 0.031723976135253906, 0.035900115966796875, 0.040076255798339844, 0.04425239562988281, 0.04842853546142578, 0.05260467529296875, 0.05678081512451172, 0.06095695495605469, 0.06513309478759766, 0.06930923461914062, 0.0734853744506836, 0.07766151428222656, 0.08183765411376953, 0.0860137939453125, 0.09018993377685547, 0.09436607360839844, 0.0985422134399414, 0.10271835327148438, 0.10689449310302734, 0.11107063293457031, 0.11524677276611328, 0.11942291259765625, 0.12359905242919922, 0.1277751922607422, 0.13195133209228516, 0.13612747192382812, 0.1403036117553711, 0.14447975158691406, 0.14865589141845703, 0.15283203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 9.0, 13.0, 18.0, 17.0, 31.0, 50.0, 84.0, 183.0, 386.0, 917.0, 2562.0, 9569.0, 65802.0, 1562390.0, 2442958.0, 92214.0, 12039.0, 2996.0, 1038.0, 477.0, 207.0, 124.0, 52.0, 46.0, 22.0, 19.0, 11.0, 12.0, 9.0, 2.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5881843566894531, -0.5718765258789062, -0.5555686950683594, -0.5392608642578125, -0.5229530334472656, -0.5066452026367188, -0.4903373718261719, -0.474029541015625, -0.4577217102050781, -0.44141387939453125, -0.4251060485839844, -0.4087982177734375, -0.3924903869628906, -0.37618255615234375, -0.3598747253417969, -0.34356689453125, -0.3272590637207031, -0.31095123291015625, -0.2946434020996094, -0.2783355712890625, -0.2620277404785156, -0.24571990966796875, -0.22941207885742188, -0.213104248046875, -0.19679641723632812, -0.18048858642578125, -0.16418075561523438, -0.1478729248046875, -0.13156509399414062, -0.11525726318359375, -0.09894943237304688, -0.0826416015625, -0.06633377075195312, -0.05002593994140625, -0.033718109130859375, -0.0174102783203125, -0.001102447509765625, 0.01520538330078125, 0.031513214111328125, 0.047821044921875, 0.06412887573242188, 0.08043670654296875, 0.09674453735351562, 0.1130523681640625, 0.12936019897460938, 0.14566802978515625, 0.16197586059570312, 0.17828369140625, 0.19459152221679688, 0.21089935302734375, 0.22720718383789062, 0.2435150146484375, 0.2598228454589844, 0.27613067626953125, 0.2924385070800781, 0.308746337890625, 0.3250541687011719, 0.34136199951171875, 0.3576698303222656, 0.3739776611328125, 0.3902854919433594, 0.40659332275390625, 0.4229011535644531, 0.439208984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 9.0, 10.0, 11.0, 18.0, 21.0, 29.0, 57.0, 71.0, 109.0, 165.0, 245.0, 417.0, 629.0, 659.0, 574.0, 357.0, 225.0, 138.0, 116.0, 74.0, 36.0, 34.0, 18.0, 15.0, 9.0, 11.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3744850158691406, -0.36127471923828125, -0.3480644226074219, -0.3348541259765625, -0.3216438293457031, -0.30843353271484375, -0.2952232360839844, -0.282012939453125, -0.2688026428222656, -0.25559234619140625, -0.24238204956054688, -0.2291717529296875, -0.21596145629882812, -0.20275115966796875, -0.18954086303710938, -0.17633056640625, -0.16312026977539062, -0.14990997314453125, -0.13669967651367188, -0.1234893798828125, -0.11027908325195312, -0.09706878662109375, -0.08385848999023438, -0.070648193359375, -0.057437896728515625, -0.04422760009765625, -0.031017303466796875, -0.0178070068359375, -0.004596710205078125, 0.00861358642578125, 0.021823883056640625, 0.0350341796875, 0.048244476318359375, 0.06145477294921875, 0.07466506958007812, 0.0878753662109375, 0.10108566284179688, 0.11429595947265625, 0.12750625610351562, 0.140716552734375, 0.15392684936523438, 0.16713714599609375, 0.18034744262695312, 0.1935577392578125, 0.20676803588867188, 0.21997833251953125, 0.23318862915039062, 0.24639892578125, 0.2596092224121094, 0.27281951904296875, 0.2860298156738281, 0.2992401123046875, 0.3124504089355469, 0.32566070556640625, 0.3388710021972656, 0.352081298828125, 0.3652915954589844, 0.37850189208984375, 0.3917121887207031, 0.4049224853515625, 0.4181327819824219, 0.43134307861328125, 0.4445533752441406, 0.457763671875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 11.0, 7.0, 15.0, 24.0, 75.0, 145.0, 234.0, 268.0, 119.0, 54.0, 20.0, 10.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.050366401672363, -5.881232261657715, -5.712097644805908, -5.542963027954102, -5.373828887939453, -5.204694747924805, -5.035560131072998, -4.866425514221191, -4.697291374206543, -4.5281572341918945, -4.359022617340088, -4.189888000488281, -4.020753860473633, -3.8516194820404053, -3.6824851036071777, -3.51335072517395, -3.3442163467407227, -3.175081968307495, -3.0059475898742676, -2.83681321144104, -2.6676788330078125, -2.498544454574585, -2.3294100761413574, -2.16027569770813, -1.9911413192749023, -1.8220069408416748, -1.6528725624084473, -1.4837381839752197, -1.3146038055419922, -1.1454694271087646, -0.9763350486755371, -0.8072006702423096, -0.6380658149719238, -0.4689314365386963, -0.29979705810546875, -0.1306626796722412, 0.03847169876098633, 0.20760607719421387, 0.3767404556274414, 0.545874834060669, 0.7150092124938965, 0.884143590927124, 1.0532779693603516, 1.222412347793579, 1.3915467262268066, 1.5606811046600342, 1.7298154830932617, 1.8989498615264893, 2.068084239959717, 2.2372186183929443, 2.406352996826172, 2.5754873752593994, 2.744621753692627, 2.9137561321258545, 3.082890510559082, 3.2520248889923096, 3.421159267425537, 3.5902936458587646, 3.759428024291992, 3.9285624027252197, 4.097696781158447, 4.266831398010254, 4.435965538024902, 4.605099678039551, 4.774234294891357]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 12.0, 32.0, 22.0, 23.0, 39.0, 51.0, 60.0, 56.0, 76.0, 83.0, 68.0, 63.0, 70.0, 58.0, 61.0, 49.0, 41.0, 34.0, 21.0, 20.0, 15.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8514225482940674, -2.7698893547058105, -2.6883559226989746, -2.6068227291107178, -2.525289297103882, -2.443756103515625, -2.362222671508789, -2.2806894779205322, -2.1991562843322754, -2.1176230907440186, -2.0360896587371826, -1.9545563459396362, -1.8730230331420898, -1.791489839553833, -1.7099565267562866, -1.6284232139587402, -1.5468897819519043, -1.465356469154358, -1.3838231563568115, -1.3022898435592651, -1.2207565307617188, -1.139223337173462, -1.0576900243759155, -0.9761567115783691, -0.8946233987808228, -0.8130900859832764, -0.73155677318573, -0.6500235199928284, -0.568490207195282, -0.4869568943977356, -0.4054236114025116, -0.3238903284072876, -0.2423572540283203, -0.16082395613193512, -0.07929065823554993, 0.002242639660835266, 0.08377593755722046, 0.16530925035476685, 0.24684253334999084, 0.32837581634521484, 0.40990912914276123, 0.4914424419403076, 0.572975754737854, 0.6545090079307556, 0.736042320728302, 0.8175756335258484, 0.89910888671875, 0.9806421995162964, 1.0621755123138428, 1.1437088251113892, 1.2252421379089355, 1.306775450706482, 1.3883087635040283, 1.4698419570922852, 1.5513752698898315, 1.632908582687378, 1.7144418954849243, 1.7959752082824707, 1.877508521080017, 1.9590418338775635, 2.0405750274658203, 2.1221084594726562, 2.203641653060913, 2.28517484664917, 2.366708278656006]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 6.0, 6.0, 10.0, 8.0, 8.0, 13.0, 19.0, 28.0, 53.0, 73.0, 110.0, 229.0, 435.0, 868.0, 1704.0, 3894.0, 10015.0, 37642.0, 233447.0, 573683.0, 146493.0, 25954.0, 7733.0, 3159.0, 1415.0, 691.0, 355.0, 205.0, 91.0, 62.0, 47.0, 31.0, 18.0, 11.0, 12.0, 6.0, 4.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.399658203125, -0.38924407958984375, -0.3788299560546875, -0.36841583251953125, -0.358001708984375, -0.34758758544921875, -0.3371734619140625, -0.32675933837890625, -0.31634521484375, -0.30593109130859375, -0.2955169677734375, -0.28510284423828125, -0.274688720703125, -0.26427459716796875, -0.2538604736328125, -0.24344635009765625, -0.2330322265625, -0.22261810302734375, -0.2122039794921875, -0.20178985595703125, -0.191375732421875, -0.18096160888671875, -0.1705474853515625, -0.16013336181640625, -0.14971923828125, -0.13930511474609375, -0.1288909912109375, -0.11847686767578125, -0.108062744140625, -0.09764862060546875, -0.0872344970703125, -0.07682037353515625, -0.06640625, -0.05599212646484375, -0.0455780029296875, -0.03516387939453125, -0.024749755859375, -0.01433563232421875, -0.0039215087890625, 0.00649261474609375, 0.01690673828125, 0.02732086181640625, 0.0377349853515625, 0.04814910888671875, 0.058563232421875, 0.06897735595703125, 0.0793914794921875, 0.08980560302734375, 0.1002197265625, 0.11063385009765625, 0.1210479736328125, 0.13146209716796875, 0.141876220703125, 0.15229034423828125, 0.1627044677734375, 0.17311859130859375, 0.18353271484375, 0.19394683837890625, 0.2043609619140625, 0.21477508544921875, 0.225189208984375, 0.23560333251953125, 0.2460174560546875, 0.25643157958984375, 0.266845703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 5.0, 6.0, 11.0, 11.0, 10.0, 15.0, 29.0, 26.0, 19.0, 26.0, 39.0, 38.0, 40.0, 34.0, 41.0, 53.0, 41.0, 48.0, 40.0, 42.0, 44.0, 40.0, 39.0, 48.0, 38.0, 24.0, 27.0, 18.0, 22.0, 22.0, 16.0, 12.0, 17.0, 6.0, 9.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1397705078125, -0.1353759765625, -0.1309814453125, -0.1265869140625, -0.1221923828125, -0.1177978515625, -0.1134033203125, -0.1090087890625, -0.1046142578125, -0.1002197265625, -0.0958251953125, -0.0914306640625, -0.0870361328125, -0.0826416015625, -0.0782470703125, -0.0738525390625, -0.0694580078125, -0.0650634765625, -0.0606689453125, -0.0562744140625, -0.0518798828125, -0.0474853515625, -0.0430908203125, -0.0386962890625, -0.0343017578125, -0.0299072265625, -0.0255126953125, -0.0211181640625, -0.0167236328125, -0.0123291015625, -0.0079345703125, -0.0035400390625, 0.0008544921875, 0.0052490234375, 0.0096435546875, 0.0140380859375, 0.0184326171875, 0.0228271484375, 0.0272216796875, 0.0316162109375, 0.0360107421875, 0.0404052734375, 0.0447998046875, 0.0491943359375, 0.0535888671875, 0.0579833984375, 0.0623779296875, 0.0667724609375, 0.0711669921875, 0.0755615234375, 0.0799560546875, 0.0843505859375, 0.0887451171875, 0.0931396484375, 0.0975341796875, 0.1019287109375, 0.1063232421875, 0.1107177734375, 0.1151123046875, 0.1195068359375, 0.1239013671875, 0.1282958984375, 0.1326904296875, 0.1370849609375, 0.1414794921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 10.0, 6.0, 14.0, 22.0, 40.0, 64.0, 97.0, 197.0, 418.0, 953.0, 2952.0, 13145.0, 192070.0, 787938.0, 42193.0, 5597.0, 1604.0, 573.0, 269.0, 162.0, 75.0, 57.0, 33.0, 13.0, 15.0, 8.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.421112060546875, -0.40374755859375, -0.386383056640625, -0.3690185546875, -0.351654052734375, -0.33428955078125, -0.316925048828125, -0.299560546875, -0.282196044921875, -0.26483154296875, -0.247467041015625, -0.2301025390625, -0.212738037109375, -0.19537353515625, -0.178009033203125, -0.16064453125, -0.143280029296875, -0.12591552734375, -0.108551025390625, -0.0911865234375, -0.073822021484375, -0.05645751953125, -0.039093017578125, -0.021728515625, -0.004364013671875, 0.01300048828125, 0.030364990234375, 0.0477294921875, 0.065093994140625, 0.08245849609375, 0.099822998046875, 0.1171875, 0.134552001953125, 0.15191650390625, 0.169281005859375, 0.1866455078125, 0.204010009765625, 0.22137451171875, 0.238739013671875, 0.256103515625, 0.273468017578125, 0.29083251953125, 0.308197021484375, 0.3255615234375, 0.342926025390625, 0.36029052734375, 0.377655029296875, 0.39501953125, 0.412384033203125, 0.42974853515625, 0.447113037109375, 0.4644775390625, 0.481842041015625, 0.49920654296875, 0.516571044921875, 0.533935546875, 0.551300048828125, 0.56866455078125, 0.586029052734375, 0.6033935546875, 0.620758056640625, 0.63812255859375, 0.655487060546875, 0.6728515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 11.0, 23.0, 24.0, 13.0, 29.0, 39.0, 31.0, 41.0, 44.0, 43.0, 45.0, 57.0, 51.0, 53.0, 53.0, 38.0, 47.0, 41.0, 39.0, 22.0, 26.0, 33.0, 23.0, 23.0, 14.0, 16.0, 13.0, 17.0, 8.0, 7.0, 5.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5791015625, -0.5621871948242188, -0.5452728271484375, -0.5283584594726562, -0.511444091796875, -0.49452972412109375, -0.4776153564453125, -0.46070098876953125, -0.44378662109375, -0.42687225341796875, -0.4099578857421875, -0.39304351806640625, -0.376129150390625, -0.35921478271484375, -0.3423004150390625, -0.32538604736328125, -0.3084716796875, -0.29155731201171875, -0.2746429443359375, -0.25772857666015625, -0.240814208984375, -0.22389984130859375, -0.2069854736328125, -0.19007110595703125, -0.17315673828125, -0.15624237060546875, -0.1393280029296875, -0.12241363525390625, -0.105499267578125, -0.08858489990234375, -0.0716705322265625, -0.05475616455078125, -0.037841796875, -0.02092742919921875, -0.0040130615234375, 0.01290130615234375, 0.029815673828125, 0.04673004150390625, 0.0636444091796875, 0.08055877685546875, 0.09747314453125, 0.11438751220703125, 0.1313018798828125, 0.14821624755859375, 0.165130615234375, 0.18204498291015625, 0.1989593505859375, 0.21587371826171875, 0.2327880859375, 0.24970245361328125, 0.2666168212890625, 0.28353118896484375, 0.300445556640625, 0.31735992431640625, 0.3342742919921875, 0.35118865966796875, 0.36810302734375, 0.38501739501953125, 0.4019317626953125, 0.41884613037109375, 0.435760498046875, 0.45267486572265625, 0.4695892333984375, 0.48650360107421875, 0.50341796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 10.0, 9.0, 24.0, 23.0, 28.0, 55.0, 65.0, 111.0, 192.0, 368.0, 624.0, 1454.0, 3241.0, 7488.0, 20955.0, 73703.0, 300826.0, 511000.0, 88318.0, 24669.0, 8674.0, 3438.0, 1582.0, 733.0, 376.0, 184.0, 151.0, 98.0, 54.0, 33.0, 13.0, 13.0, 15.0, 13.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.095458984375, -0.091796875, -0.088134765625, -0.08447265625, -0.080810546875, -0.0771484375, -0.073486328125, -0.06982421875, -0.066162109375, -0.0625, -0.058837890625, -0.05517578125, -0.051513671875, -0.0478515625, -0.044189453125, -0.04052734375, -0.036865234375, -0.033203125, -0.029541015625, -0.02587890625, -0.022216796875, -0.0185546875, -0.014892578125, -0.01123046875, -0.007568359375, -0.00390625, -0.000244140625, 0.00341796875, 0.007080078125, 0.0107421875, 0.014404296875, 0.01806640625, 0.021728515625, 0.025390625, 0.029052734375, 0.03271484375, 0.036376953125, 0.0400390625, 0.043701171875, 0.04736328125, 0.051025390625, 0.0546875, 0.058349609375, 0.06201171875, 0.065673828125, 0.0693359375, 0.072998046875, 0.07666015625, 0.080322265625, 0.083984375, 0.087646484375, 0.09130859375, 0.094970703125, 0.0986328125, 0.102294921875, 0.10595703125, 0.109619140625, 0.11328125, 0.116943359375, 0.12060546875, 0.124267578125, 0.1279296875, 0.131591796875, 0.13525390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 5.0, 7.0, 21.0, 18.0, 27.0, 46.0, 60.0, 60.0, 75.0, 89.0, 93.0, 94.0, 77.0, 64.0, 58.0, 45.0, 29.0, 21.0, 29.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.817413330078125e-05, -5.659274756908417e-05, -5.5011361837387085e-05, -5.342997610569e-05, -5.184859037399292e-05, -5.026720464229584e-05, -4.8685818910598755e-05, -4.710443317890167e-05, -4.552304744720459e-05, -4.394166171550751e-05, -4.2360275983810425e-05, -4.077889025211334e-05, -3.919750452041626e-05, -3.761611878871918e-05, -3.6034733057022095e-05, -3.445334732532501e-05, -3.287196159362793e-05, -3.129057586193085e-05, -2.9709190130233765e-05, -2.8127804398536682e-05, -2.65464186668396e-05, -2.4965032935142517e-05, -2.3383647203445435e-05, -2.1802261471748352e-05, -2.022087574005127e-05, -1.8639490008354187e-05, -1.7058104276657104e-05, -1.5476718544960022e-05, -1.389533281326294e-05, -1.2313947081565857e-05, -1.0732561349868774e-05, -9.151175618171692e-06, -7.569789886474609e-06, -5.988404154777527e-06, -4.407018423080444e-06, -2.825632691383362e-06, -1.2442469596862793e-06, 3.371387720108032e-07, 1.9185245037078857e-06, 3.4999102354049683e-06, 5.081295967102051e-06, 6.662681698799133e-06, 8.244067430496216e-06, 9.825453162193298e-06, 1.1406838893890381e-05, 1.2988224625587463e-05, 1.4569610357284546e-05, 1.615099608898163e-05, 1.773238182067871e-05, 1.9313767552375793e-05, 2.0895153284072876e-05, 2.247653901576996e-05, 2.405792474746704e-05, 2.5639310479164124e-05, 2.7220696210861206e-05, 2.880208194255829e-05, 3.038346767425537e-05, 3.1964853405952454e-05, 3.3546239137649536e-05, 3.512762486934662e-05, 3.67090106010437e-05, 3.8290396332740784e-05, 3.9871782064437866e-05, 4.145316779613495e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 17.0, 32.0, 50.0, 74.0, 149.0, 305.0, 707.0, 2069.0, 8154.0, 49308.0, 602710.0, 337911.0, 37503.0, 6521.0, 1806.0, 614.0, 286.0, 132.0, 88.0, 32.0, 22.0, 15.0, 11.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.1772480010986328, -0.17090225219726562, -0.16455650329589844, -0.15821075439453125, -0.15186500549316406, -0.14551925659179688, -0.1391735076904297, -0.1328277587890625, -0.1264820098876953, -0.12013626098632812, -0.11379051208496094, -0.10744476318359375, -0.10109901428222656, -0.09475326538085938, -0.08840751647949219, -0.082061767578125, -0.07571601867675781, -0.06937026977539062, -0.06302452087402344, -0.05667877197265625, -0.05033302307128906, -0.043987274169921875, -0.03764152526855469, -0.0312957763671875, -0.024950027465820312, -0.018604278564453125, -0.012258529663085938, -0.00591278076171875, 0.0004329681396484375, 0.006778717041015625, 0.013124465942382812, 0.01947021484375, 0.025815963745117188, 0.032161712646484375, 0.03850746154785156, 0.04485321044921875, 0.05119895935058594, 0.057544708251953125, 0.06389045715332031, 0.0702362060546875, 0.07658195495605469, 0.08292770385742188, 0.08927345275878906, 0.09561920166015625, 0.10196495056152344, 0.10831069946289062, 0.11465644836425781, 0.121002197265625, 0.1273479461669922, 0.13369369506835938, 0.14003944396972656, 0.14638519287109375, 0.15273094177246094, 0.15907669067382812, 0.1654224395751953, 0.1717681884765625, 0.1781139373779297, 0.18445968627929688, 0.19080543518066406, 0.19715118408203125, 0.20349693298339844, 0.20984268188476562, 0.2161884307861328, 0.2225341796875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 16.0, 7.0, 14.0, 16.0, 17.0, 18.0, 23.0, 38.0, 37.0, 47.0, 73.0, 65.0, 74.0, 74.0, 95.0, 67.0, 55.0, 42.0, 38.0, 48.0, 26.0, 17.0, 13.0, 20.0, 12.0, 9.0, 5.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11757659912109375, -0.1139373779296875, -0.11029815673828125, -0.106658935546875, -0.10301971435546875, -0.0993804931640625, -0.09574127197265625, -0.09210205078125, -0.08846282958984375, -0.0848236083984375, -0.08118438720703125, -0.077545166015625, -0.07390594482421875, -0.0702667236328125, -0.06662750244140625, -0.06298828125, -0.05934906005859375, -0.0557098388671875, -0.05207061767578125, -0.048431396484375, -0.04479217529296875, -0.0411529541015625, -0.03751373291015625, -0.03387451171875, -0.03023529052734375, -0.0265960693359375, -0.02295684814453125, -0.019317626953125, -0.01567840576171875, -0.0120391845703125, -0.00839996337890625, -0.0047607421875, -0.00112152099609375, 0.0025177001953125, 0.00615692138671875, 0.009796142578125, 0.01343536376953125, 0.0170745849609375, 0.02071380615234375, 0.02435302734375, 0.02799224853515625, 0.0316314697265625, 0.03527069091796875, 0.038909912109375, 0.04254913330078125, 0.0461883544921875, 0.04982757568359375, 0.053466796875, 0.05710601806640625, 0.0607452392578125, 0.06438446044921875, 0.068023681640625, 0.07166290283203125, 0.0753021240234375, 0.07894134521484375, 0.08258056640625, 0.08621978759765625, 0.0898590087890625, 0.09349822998046875, 0.097137451171875, 0.10077667236328125, 0.1044158935546875, 0.10805511474609375, 0.1116943359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 8.0, 9.0, 19.0, 40.0, 81.0, 111.0, 248.0, 181.0, 135.0, 78.0, 34.0, 12.0, 11.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.750999927520752, -2.6521968841552734, -2.553393840789795, -2.4545907974243164, -2.355787754058838, -2.2569847106933594, -2.158181667327881, -2.0593786239624023, -1.9605754613876343, -1.8617724180221558, -1.7629693746566772, -1.6641662120819092, -1.5653631687164307, -1.4665601253509521, -1.3677570819854736, -1.2689540386199951, -1.1701509952545166, -1.071347951889038, -0.9725449085235596, -0.8737418055534363, -0.7749387621879578, -0.6761357188224792, -0.577332615852356, -0.47852957248687744, -0.3797265291213989, -0.2809234857559204, -0.1821204125881195, -0.0833173394203186, 0.015485703945159912, 0.11428874731063843, 0.21309185028076172, 0.31189489364624023, 0.41069769859313965, 0.5095007419586182, 0.6083037853240967, 0.70710688829422, 0.8059099316596985, 0.904712975025177, 1.0035160779953003, 1.1023191213607788, 1.2011221647262573, 1.2999252080917358, 1.3987282514572144, 1.4975314140319824, 1.596334457397461, 1.6951375007629395, 1.793940544128418, 1.8927435874938965, 1.991546630859375, 2.0903496742248535, 2.189152717590332, 2.2879557609558105, 2.386758804321289, 2.4855618476867676, 2.584364891052246, 2.6831679344177246, 2.781970977783203, 2.8807740211486816, 2.97957706451416, 3.0783801078796387, 3.177183151245117, 3.2759861946105957, 3.374789237976074, 3.4735922813415527, 3.5723955631256104]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 9.0, 9.0, 11.0, 16.0, 13.0, 30.0, 27.0, 29.0, 25.0, 43.0, 41.0, 50.0, 58.0, 78.0, 83.0, 89.0, 62.0, 49.0, 40.0, 32.0, 35.0, 21.0, 23.0, 25.0, 21.0, 14.0, 13.0, 15.0, 7.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5994820594787598, -2.5223748683929443, -2.445267677307129, -2.3681602478027344, -2.291053056716919, -2.2139458656311035, -2.136838674545288, -2.0597314834594727, -1.9826240539550781, -1.9055168628692627, -1.8284095525741577, -1.7513023614883423, -1.6741950511932373, -1.5970878601074219, -1.5199806690216064, -1.4428733587265015, -1.365766167640686, -1.2886589765548706, -1.2115516662597656, -1.1344444751739502, -1.0573371648788452, -0.9802299737930298, -0.9031227231025696, -0.8260154724121094, -0.7489082217216492, -0.671800971031189, -0.5946937203407288, -0.5175864696502686, -0.44047924876213074, -0.36337199807167053, -0.2862647771835327, -0.2091575264930725, -0.1320502758026123, -0.0549430325627327, 0.02216421067714691, 0.09927144646644592, 0.17637869715690613, 0.25348594784736633, 0.33059316873550415, 0.40770041942596436, 0.48480767011642456, 0.5619149208068848, 0.639022171497345, 0.7161294221878052, 0.7932366132736206, 0.8703439235687256, 0.947451114654541, 1.0245583057403564, 1.1016656160354614, 1.1787728071212769, 1.2558801174163818, 1.3329873085021973, 1.4100946187973022, 1.4872018098831177, 1.5643091201782227, 1.641416311264038, 1.7185235023498535, 1.795630693435669, 1.872738003730774, 1.9498451948165894, 2.0269525051116943, 2.1040596961975098, 2.181166887283325, 2.2582740783691406, 2.335381507873535]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 8.0, 3.0, 5.0, 6.0, 6.0, 8.0, 19.0, 16.0, 29.0, 37.0, 70.0, 156.0, 405.0, 1085.0, 4111.0, 19520.0, 168978.0, 2909569.0, 1017544.0, 59727.0, 9510.0, 2208.0, 721.0, 273.0, 108.0, 54.0, 21.0, 28.0, 19.0, 15.0, 4.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37939453125, -0.3684883117675781, -0.35758209228515625, -0.3466758728027344, -0.3357696533203125, -0.3248634338378906, -0.31395721435546875, -0.3030509948730469, -0.292144775390625, -0.2812385559082031, -0.27033233642578125, -0.2594261169433594, -0.2485198974609375, -0.23761367797851562, -0.22670745849609375, -0.21580123901367188, -0.20489501953125, -0.19398880004882812, -0.18308258056640625, -0.17217636108398438, -0.1612701416015625, -0.15036392211914062, -0.13945770263671875, -0.12855148315429688, -0.117645263671875, -0.10673904418945312, -0.09583282470703125, -0.08492660522460938, -0.0740203857421875, -0.06311416625976562, -0.05220794677734375, -0.041301727294921875, -0.0303955078125, -0.019489288330078125, -0.00858306884765625, 0.002323150634765625, 0.0132293701171875, 0.024135589599609375, 0.03504180908203125, 0.045948028564453125, 0.056854248046875, 0.06776046752929688, 0.07866668701171875, 0.08957290649414062, 0.1004791259765625, 0.11138534545898438, 0.12229156494140625, 0.13319778442382812, 0.14410400390625, 0.15501022338867188, 0.16591644287109375, 0.17682266235351562, 0.1877288818359375, 0.19863510131835938, 0.20954132080078125, 0.22044754028320312, 0.231353759765625, 0.24225997924804688, 0.25316619873046875, 0.2640724182128906, 0.2749786376953125, 0.2858848571777344, 0.29679107666015625, 0.3076972961425781, 0.318603515625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 0.0, 3.0, 9.0, 4.0, 9.0, 6.0, 16.0, 15.0, 21.0, 29.0, 34.0, 33.0, 36.0, 35.0, 42.0, 42.0, 59.0, 52.0, 54.0, 46.0, 46.0, 55.0, 54.0, 50.0, 42.0, 32.0, 23.0, 18.0, 22.0, 26.0, 16.0, 17.0, 16.0, 13.0, 11.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.13803482055664062, -0.13312530517578125, -0.12821578979492188, -0.1233062744140625, -0.11839675903320312, -0.11348724365234375, -0.10857772827148438, -0.103668212890625, -0.09875869750976562, -0.09384918212890625, -0.08893966674804688, -0.0840301513671875, -0.07912063598632812, -0.07421112060546875, -0.06930160522460938, -0.06439208984375, -0.059482574462890625, -0.05457305908203125, -0.049663543701171875, -0.0447540283203125, -0.039844512939453125, -0.03493499755859375, -0.030025482177734375, -0.025115966796875, -0.020206451416015625, -0.01529693603515625, -0.010387420654296875, -0.0054779052734375, -0.000568389892578125, 0.00434112548828125, 0.009250640869140625, 0.01416015625, 0.019069671630859375, 0.02397918701171875, 0.028888702392578125, 0.0337982177734375, 0.038707733154296875, 0.04361724853515625, 0.048526763916015625, 0.053436279296875, 0.058345794677734375, 0.06325531005859375, 0.06816482543945312, 0.0730743408203125, 0.07798385620117188, 0.08289337158203125, 0.08780288696289062, 0.09271240234375, 0.09762191772460938, 0.10253143310546875, 0.10744094848632812, 0.1123504638671875, 0.11725997924804688, 0.12216949462890625, 0.12707901000976562, 0.131988525390625, 0.13689804077148438, 0.14180755615234375, 0.14671707153320312, 0.1516265869140625, 0.15653610229492188, 0.16144561767578125, 0.16635513305664062, 0.1712646484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 11.0, 6.0, 12.0, 22.0, 33.0, 42.0, 67.0, 120.0, 234.0, 560.0, 2023.0, 11973.0, 129527.0, 3364816.0, 646010.0, 32891.0, 4237.0, 978.0, 312.0, 156.0, 82.0, 37.0, 42.0, 24.0, 8.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.474609375, -0.45916748046875, -0.4437255859375, -0.42828369140625, -0.412841796875, -0.39739990234375, -0.3819580078125, -0.36651611328125, -0.35107421875, -0.33563232421875, -0.3201904296875, -0.30474853515625, -0.289306640625, -0.27386474609375, -0.2584228515625, -0.24298095703125, -0.2275390625, -0.21209716796875, -0.1966552734375, -0.18121337890625, -0.165771484375, -0.15032958984375, -0.1348876953125, -0.11944580078125, -0.10400390625, -0.08856201171875, -0.0731201171875, -0.05767822265625, -0.042236328125, -0.02679443359375, -0.0113525390625, 0.00408935546875, 0.01953125, 0.03497314453125, 0.0504150390625, 0.06585693359375, 0.081298828125, 0.09674072265625, 0.1121826171875, 0.12762451171875, 0.14306640625, 0.15850830078125, 0.1739501953125, 0.18939208984375, 0.204833984375, 0.22027587890625, 0.2357177734375, 0.25115966796875, 0.2666015625, 0.28204345703125, 0.2974853515625, 0.31292724609375, 0.328369140625, 0.34381103515625, 0.3592529296875, 0.37469482421875, 0.39013671875, 0.40557861328125, 0.4210205078125, 0.43646240234375, 0.451904296875, 0.46734619140625, 0.4827880859375, 0.49822998046875, 0.513671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 15.0, 13.0, 19.0, 24.0, 37.0, 43.0, 57.0, 94.0, 126.0, 201.0, 350.0, 458.0, 539.0, 670.0, 480.0, 307.0, 196.0, 121.0, 99.0, 51.0, 55.0, 27.0, 23.0, 17.0, 9.0, 7.0, 7.0, 9.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33642578125, -0.3259239196777344, -0.31542205810546875, -0.3049201965332031, -0.2944183349609375, -0.2839164733886719, -0.27341461181640625, -0.2629127502441406, -0.252410888671875, -0.24190902709960938, -0.23140716552734375, -0.22090530395507812, -0.2104034423828125, -0.19990158081054688, -0.18939971923828125, -0.17889785766601562, -0.16839599609375, -0.15789413452148438, -0.14739227294921875, -0.13689041137695312, -0.1263885498046875, -0.11588668823242188, -0.10538482666015625, -0.09488296508789062, -0.084381103515625, -0.07387924194335938, -0.06337738037109375, -0.052875518798828125, -0.0423736572265625, -0.031871795654296875, -0.02136993408203125, -0.010868072509765625, -0.0003662109375, 0.010135650634765625, 0.02063751220703125, 0.031139373779296875, 0.0416412353515625, 0.052143096923828125, 0.06264495849609375, 0.07314682006835938, 0.083648681640625, 0.09415054321289062, 0.10465240478515625, 0.11515426635742188, 0.1256561279296875, 0.13615798950195312, 0.14665985107421875, 0.15716171264648438, 0.16766357421875, 0.17816543579101562, 0.18866729736328125, 0.19916915893554688, 0.2096710205078125, 0.22017288208007812, 0.23067474365234375, 0.24117660522460938, 0.251678466796875, 0.2621803283691406, 0.27268218994140625, 0.2831840515136719, 0.2936859130859375, 0.3041877746582031, 0.31468963623046875, 0.3251914978027344, 0.335693359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 15.0, 27.0, 143.0, 316.0, 338.0, 102.0, 32.0, 15.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.793111801147461, -11.566461563110352, -11.339810371398926, -11.113160133361816, -10.886509895324707, -10.659858703613281, -10.433208465576172, -10.206558227539062, -9.979907035827637, -9.753256797790527, -9.526605606079102, -9.299955368041992, -9.073305130004883, -8.846653938293457, -8.620003700256348, -8.393353462219238, -8.166703224182129, -7.940052509307861, -7.713402271270752, -7.486751556396484, -7.260100841522217, -7.033450603485107, -6.80679988861084, -6.5801496505737305, -6.353498458862305, -6.126847743988037, -5.900197505950928, -5.67354679107666, -5.446896076202393, -5.220245838165283, -4.993595123291016, -4.766944885253906, -4.5402936935424805, -4.313642978668213, -4.0869927406311035, -3.860342025756836, -3.6336915493011475, -3.407041072845459, -3.1803903579711914, -2.953739881515503, -2.7270894050598145, -2.500438928604126, -2.2737882137298584, -2.04713773727417, -1.8204872608184814, -1.5938366651535034, -1.3671860694885254, -1.140535593032837, -0.9138851165771484, -0.6872345805168152, -0.46058401465415955, -0.2339334487915039, -0.007282912731170654, 0.2193676233291626, 0.4460182189941406, 0.6726686954498291, 0.8993192911148071, 1.1259698867797852, 1.3526203632354736, 1.5792709589004517, 1.8059215545654297, 2.032572031021118, 2.2592225074768066, 2.485873222351074, 2.7125236988067627]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 6.0, 6.0, 5.0, 5.0, 11.0, 11.0, 12.0, 9.0, 7.0, 11.0, 18.0, 12.0, 23.0, 24.0, 24.0, 21.0, 33.0, 33.0, 39.0, 26.0, 38.0, 36.0, 22.0, 40.0, 32.0, 41.0, 32.0, 25.0, 37.0, 44.0, 28.0, 34.0, 31.0, 32.0, 23.0, 21.0, 21.0, 23.0, 16.0, 10.0, 18.0, 9.0, 10.0, 10.0, 10.0, 3.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.1417587995529175, -1.106102466583252, -1.0704461336135864, -1.034789800643921, -0.9991334676742554, -0.9634771347045898, -0.9278208017349243, -0.8921644687652588, -0.8565081357955933, -0.8208518028259277, -0.7851954698562622, -0.7495391368865967, -0.7138828039169312, -0.6782264709472656, -0.6425701379776001, -0.6069138050079346, -0.5712575316429138, -0.5356011986732483, -0.49994486570358276, -0.46428853273391724, -0.4286321997642517, -0.3929758667945862, -0.35731956362724304, -0.3216632306575775, -0.286006897687912, -0.25035056471824646, -0.21469423174858093, -0.1790379136800766, -0.14338158071041107, -0.10772524774074554, -0.07206892967224121, -0.036412596702575684, -0.0007562637329101562, 0.03490006551146507, 0.0705563947558403, 0.10621272027492523, 0.14186905324459076, 0.1775253862142563, 0.21318170428276062, 0.24883803725242615, 0.2844943702220917, 0.3201507031917572, 0.35580703616142273, 0.39146333932876587, 0.4271196722984314, 0.4627760052680969, 0.49843233823776245, 0.534088671207428, 0.5697450041770935, 0.605401337146759, 0.6410576701164246, 0.6767140030860901, 0.7123703360557556, 0.7480266690254211, 0.7836829423904419, 0.8193392753601074, 0.854995608329773, 0.8906519412994385, 0.926308274269104, 0.9619646072387695, 0.9976209402084351, 1.0332772731781006, 1.0689336061477661, 1.1045899391174316, 1.1402462720870972]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 7.0, 14.0, 10.0, 22.0, 32.0, 40.0, 45.0, 75.0, 129.0, 186.0, 270.0, 354.0, 614.0, 953.0, 1560.0, 2932.0, 5791.0, 13231.0, 35589.0, 120050.0, 390408.0, 330964.0, 93723.0, 28747.0, 11098.0, 5143.0, 2697.0, 1392.0, 822.0, 575.0, 337.0, 241.0, 146.0, 100.0, 68.0, 50.0, 40.0, 22.0, 16.0, 13.0, 15.0, 13.0, 3.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.20849609375, -0.2017498016357422, -0.19500350952148438, -0.18825721740722656, -0.18151092529296875, -0.17476463317871094, -0.16801834106445312, -0.1612720489501953, -0.1545257568359375, -0.1477794647216797, -0.14103317260742188, -0.13428688049316406, -0.12754058837890625, -0.12079429626464844, -0.11404800415039062, -0.10730171203613281, -0.100555419921875, -0.09380912780761719, -0.08706283569335938, -0.08031654357910156, -0.07357025146484375, -0.06682395935058594, -0.060077667236328125, -0.05333137512207031, -0.0465850830078125, -0.03983879089355469, -0.033092498779296875, -0.026346206665039062, -0.01959991455078125, -0.012853622436523438, -0.006107330322265625, 0.0006389617919921875, 0.00738525390625, 0.014131546020507812, 0.020877838134765625, 0.027624130249023438, 0.03437042236328125, 0.04111671447753906, 0.047863006591796875, 0.05460929870605469, 0.0613555908203125, 0.06810188293457031, 0.07484817504882812, 0.08159446716308594, 0.08834075927734375, 0.09508705139160156, 0.10183334350585938, 0.10857963562011719, 0.115325927734375, 0.12207221984863281, 0.12881851196289062, 0.13556480407714844, 0.14231109619140625, 0.14905738830566406, 0.15580368041992188, 0.1625499725341797, 0.1692962646484375, 0.1760425567626953, 0.18278884887695312, 0.18953514099121094, 0.19628143310546875, 0.20302772521972656, 0.20977401733398438, 0.2165203094482422, 0.2232666015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 7.0, 11.0, 16.0, 21.0, 29.0, 23.0, 24.0, 41.0, 27.0, 39.0, 35.0, 41.0, 46.0, 42.0, 53.0, 45.0, 61.0, 56.0, 56.0, 37.0, 31.0, 38.0, 39.0, 29.0, 29.0, 24.0, 16.0, 18.0, 8.0, 13.0, 5.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.13857460021972656, -0.13347244262695312, -0.1283702850341797, -0.12326812744140625, -0.11816596984863281, -0.11306381225585938, -0.10796165466308594, -0.1028594970703125, -0.09775733947753906, -0.09265518188476562, -0.08755302429199219, -0.08245086669921875, -0.07734870910644531, -0.07224655151367188, -0.06714439392089844, -0.062042236328125, -0.05694007873535156, -0.051837921142578125, -0.04673576354980469, -0.04163360595703125, -0.03653144836425781, -0.031429290771484375, -0.026327133178710938, -0.0212249755859375, -0.016122817993164062, -0.011020660400390625, -0.0059185028076171875, -0.00081634521484375, 0.0042858123779296875, 0.009387969970703125, 0.014490127563476562, 0.01959228515625, 0.024694442749023438, 0.029796600341796875, 0.03489875793457031, 0.04000091552734375, 0.04510307312011719, 0.050205230712890625, 0.05530738830566406, 0.0604095458984375, 0.06551170349121094, 0.07061386108398438, 0.07571601867675781, 0.08081817626953125, 0.08592033386230469, 0.09102249145507812, 0.09612464904785156, 0.101226806640625, 0.10632896423339844, 0.11143112182617188, 0.11653327941894531, 0.12163543701171875, 0.1267375946044922, 0.13183975219726562, 0.13694190979003906, 0.1420440673828125, 0.14714622497558594, 0.15224838256835938, 0.1573505401611328, 0.16245269775390625, 0.1675548553466797, 0.17265701293945312, 0.17775917053222656, 0.182861328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 5.0, 15.0, 21.0, 19.0, 32.0, 31.0, 49.0, 68.0, 146.0, 206.0, 279.0, 569.0, 1157.0, 2932.0, 10884.0, 77215.0, 791950.0, 140172.0, 15867.0, 3844.0, 1451.0, 641.0, 351.0, 216.0, 136.0, 72.0, 59.0, 38.0, 35.0, 24.0, 16.0, 7.0, 13.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42431640625, -0.41089630126953125, -0.3974761962890625, -0.38405609130859375, -0.370635986328125, -0.35721588134765625, -0.3437957763671875, -0.33037567138671875, -0.31695556640625, -0.30353546142578125, -0.2901153564453125, -0.27669525146484375, -0.263275146484375, -0.24985504150390625, -0.2364349365234375, -0.22301483154296875, -0.2095947265625, -0.19617462158203125, -0.1827545166015625, -0.16933441162109375, -0.155914306640625, -0.14249420166015625, -0.1290740966796875, -0.11565399169921875, -0.10223388671875, -0.08881378173828125, -0.0753936767578125, -0.06197357177734375, -0.048553466796875, -0.03513336181640625, -0.0217132568359375, -0.00829315185546875, 0.005126953125, 0.01854705810546875, 0.0319671630859375, 0.04538726806640625, 0.058807373046875, 0.07222747802734375, 0.0856475830078125, 0.09906768798828125, 0.11248779296875, 0.12590789794921875, 0.1393280029296875, 0.15274810791015625, 0.166168212890625, 0.17958831787109375, 0.1930084228515625, 0.20642852783203125, 0.2198486328125, 0.23326873779296875, 0.2466888427734375, 0.26010894775390625, 0.273529052734375, 0.28694915771484375, 0.3003692626953125, 0.31378936767578125, 0.32720947265625, 0.34062957763671875, 0.3540496826171875, 0.36746978759765625, 0.380889892578125, 0.39430999755859375, 0.4077301025390625, 0.42115020751953125, 0.4345703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 6.0, 11.0, 9.0, 15.0, 15.0, 20.0, 22.0, 33.0, 43.0, 39.0, 41.0, 54.0, 52.0, 37.0, 70.0, 64.0, 63.0, 42.0, 59.0, 43.0, 50.0, 27.0, 36.0, 25.0, 23.0, 17.0, 14.0, 17.0, 8.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59228515625, -0.5718154907226562, -0.5513458251953125, -0.5308761596679688, -0.510406494140625, -0.48993682861328125, -0.4694671630859375, -0.44899749755859375, -0.42852783203125, -0.40805816650390625, -0.3875885009765625, -0.36711883544921875, -0.346649169921875, -0.32617950439453125, -0.3057098388671875, -0.28524017333984375, -0.2647705078125, -0.24430084228515625, -0.2238311767578125, -0.20336151123046875, -0.182891845703125, -0.16242218017578125, -0.1419525146484375, -0.12148284912109375, -0.10101318359375, -0.08054351806640625, -0.0600738525390625, -0.03960418701171875, -0.019134521484375, 0.00133514404296875, 0.0218048095703125, 0.04227447509765625, 0.062744140625, 0.08321380615234375, 0.1036834716796875, 0.12415313720703125, 0.144622802734375, 0.16509246826171875, 0.1855621337890625, 0.20603179931640625, 0.22650146484375, 0.24697113037109375, 0.2674407958984375, 0.28791046142578125, 0.308380126953125, 0.32884979248046875, 0.3493194580078125, 0.36978912353515625, 0.3902587890625, 0.41072845458984375, 0.4311981201171875, 0.45166778564453125, 0.472137451171875, 0.49260711669921875, 0.5130767822265625, 0.5335464477539062, 0.55401611328125, 0.5744857788085938, 0.5949554443359375, 0.6154251098632812, 0.635894775390625, 0.6563644409179688, 0.6768341064453125, 0.6973037719726562, 0.7177734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 5.0, 10.0, 12.0, 18.0, 35.0, 55.0, 92.0, 198.0, 337.0, 653.0, 1366.0, 3278.0, 8952.0, 31766.0, 179772.0, 710198.0, 83045.0, 18403.0, 5953.0, 2254.0, 1026.0, 502.0, 248.0, 149.0, 75.0, 55.0, 38.0, 21.0, 11.0, 8.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.167236328125, -0.16318702697753906, -0.15913772583007812, -0.1550884246826172, -0.15103912353515625, -0.1469898223876953, -0.14294052124023438, -0.13889122009277344, -0.1348419189453125, -0.13079261779785156, -0.12674331665039062, -0.12269401550292969, -0.11864471435546875, -0.11459541320800781, -0.11054611206054688, -0.10649681091308594, -0.102447509765625, -0.09839820861816406, -0.09434890747070312, -0.09029960632324219, -0.08625030517578125, -0.08220100402832031, -0.07815170288085938, -0.07410240173339844, -0.0700531005859375, -0.06600379943847656, -0.061954498291015625, -0.05790519714355469, -0.05385589599609375, -0.04980659484863281, -0.045757293701171875, -0.04170799255371094, -0.03765869140625, -0.03360939025878906, -0.029560089111328125, -0.025510787963867188, -0.02146148681640625, -0.017412185668945312, -0.013362884521484375, -0.009313583374023438, -0.0052642822265625, -0.0012149810791015625, 0.002834320068359375, 0.0068836212158203125, 0.01093292236328125, 0.014982223510742188, 0.019031524658203125, 0.023080825805664062, 0.027130126953125, 0.031179428100585938, 0.035228729248046875, 0.03927803039550781, 0.04332733154296875, 0.04737663269042969, 0.051425933837890625, 0.05547523498535156, 0.0595245361328125, 0.06357383728027344, 0.06762313842773438, 0.07167243957519531, 0.07572174072265625, 0.07977104187011719, 0.08382034301757812, 0.08786964416503906, 0.0919189453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 17.0, 24.0, 31.0, 65.0, 100.0, 106.0, 115.0, 129.0, 127.0, 81.0, 51.0, 32.0, 30.0, 22.0, 10.0, 5.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59687614440918e-05, -5.395989865064621e-05, -5.195103585720062e-05, -4.9942173063755035e-05, -4.793331027030945e-05, -4.592444747686386e-05, -4.3915584683418274e-05, -4.190672188997269e-05, -3.98978590965271e-05, -3.788899630308151e-05, -3.5880133509635925e-05, -3.387127071619034e-05, -3.186240792274475e-05, -2.9853545129299164e-05, -2.7844682335853577e-05, -2.583581954240799e-05, -2.3826956748962402e-05, -2.1818093955516815e-05, -1.9809231162071228e-05, -1.780036836862564e-05, -1.5791505575180054e-05, -1.3782642781734467e-05, -1.177377998828888e-05, -9.764917194843292e-06, -7.756054401397705e-06, -5.747191607952118e-06, -3.7383288145065308e-06, -1.7294660210609436e-06, 2.7939677238464355e-07, 2.2882595658302307e-06, 4.297122359275818e-06, 6.305985152721405e-06, 8.314847946166992e-06, 1.032371073961258e-05, 1.2332573533058167e-05, 1.4341436326503754e-05, 1.635029911994934e-05, 1.8359161913394928e-05, 2.0368024706840515e-05, 2.2376887500286102e-05, 2.438575029373169e-05, 2.6394613087177277e-05, 2.8403475880622864e-05, 3.041233867406845e-05, 3.242120146751404e-05, 3.4430064260959625e-05, 3.643892705440521e-05, 3.84477898478508e-05, 4.045665264129639e-05, 4.2465515434741974e-05, 4.447437822818756e-05, 4.648324102163315e-05, 4.8492103815078735e-05, 5.050096660852432e-05, 5.250982940196991e-05, 5.45186921954155e-05, 5.6527554988861084e-05, 5.853641778230667e-05, 6.054528057575226e-05, 6.255414336919785e-05, 6.456300616264343e-05, 6.657186895608902e-05, 6.858073174953461e-05, 7.05895945429802e-05, 7.259845733642578e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 8.0, 16.0, 26.0, 43.0, 55.0, 106.0, 184.0, 319.0, 626.0, 1426.0, 3329.0, 9452.0, 34015.0, 190586.0, 695328.0, 83976.0, 18705.0, 5981.0, 2219.0, 1033.0, 453.0, 271.0, 145.0, 80.0, 56.0, 38.0, 21.0, 13.0, 7.0, 6.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1334228515625, -0.12915802001953125, -0.1248931884765625, -0.12062835693359375, -0.116363525390625, -0.11209869384765625, -0.1078338623046875, -0.10356903076171875, -0.09930419921875, -0.09503936767578125, -0.0907745361328125, -0.08650970458984375, -0.082244873046875, -0.07798004150390625, -0.0737152099609375, -0.06945037841796875, -0.065185546875, -0.06092071533203125, -0.0566558837890625, -0.05239105224609375, -0.048126220703125, -0.04386138916015625, -0.0395965576171875, -0.03533172607421875, -0.03106689453125, -0.02680206298828125, -0.0225372314453125, -0.01827239990234375, -0.014007568359375, -0.00974273681640625, -0.0054779052734375, -0.00121307373046875, 0.0030517578125, 0.00731658935546875, 0.0115814208984375, 0.01584625244140625, 0.020111083984375, 0.02437591552734375, 0.0286407470703125, 0.03290557861328125, 0.03717041015625, 0.04143524169921875, 0.0457000732421875, 0.04996490478515625, 0.054229736328125, 0.05849456787109375, 0.0627593994140625, 0.06702423095703125, 0.0712890625, 0.07555389404296875, 0.0798187255859375, 0.08408355712890625, 0.088348388671875, 0.09261322021484375, 0.0968780517578125, 0.10114288330078125, 0.10540771484375, 0.10967254638671875, 0.1139373779296875, 0.11820220947265625, 0.122467041015625, 0.12673187255859375, 0.1309967041015625, 0.13526153564453125, 0.1395263671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 8.0, 11.0, 8.0, 13.0, 25.0, 16.0, 25.0, 26.0, 44.0, 48.0, 70.0, 84.0, 102.0, 92.0, 105.0, 73.0, 59.0, 45.0, 26.0, 24.0, 16.0, 14.0, 12.0, 5.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09637451171875, -0.0927896499633789, -0.08920478820800781, -0.08561992645263672, -0.08203506469726562, -0.07845020294189453, -0.07486534118652344, -0.07128047943115234, -0.06769561767578125, -0.06411075592041016, -0.06052589416503906, -0.05694103240966797, -0.053356170654296875, -0.04977130889892578, -0.04618644714355469, -0.042601585388183594, -0.0390167236328125, -0.035431861877441406, -0.03184700012207031, -0.02826213836669922, -0.024677276611328125, -0.02109241485595703, -0.017507553100585938, -0.013922691345214844, -0.01033782958984375, -0.006752967834472656, -0.0031681060791015625, 0.00041675567626953125, 0.004001617431640625, 0.007586479187011719, 0.011171340942382812, 0.014756202697753906, 0.018341064453125, 0.021925926208496094, 0.025510787963867188, 0.02909564971923828, 0.032680511474609375, 0.03626537322998047, 0.03985023498535156, 0.043435096740722656, 0.04701995849609375, 0.050604820251464844, 0.05418968200683594, 0.05777454376220703, 0.061359405517578125, 0.06494426727294922, 0.06852912902832031, 0.0721139907836914, 0.0756988525390625, 0.0792837142944336, 0.08286857604980469, 0.08645343780517578, 0.09003829956054688, 0.09362316131591797, 0.09720802307128906, 0.10079288482666016, 0.10437774658203125, 0.10796260833740234, 0.11154747009277344, 0.11513233184814453, 0.11871719360351562, 0.12230205535888672, 0.1258869171142578, 0.1294717788696289, 0.133056640625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 9.0, 15.0, 18.0, 53.0, 117.0, 191.0, 297.0, 151.0, 72.0, 28.0, 22.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9592761993408203, -1.8519467115402222, -1.744617223739624, -1.6372878551483154, -1.5299582481384277, -1.4226288795471191, -1.315299391746521, -1.2079699039459229, -1.1006404161453247, -0.9933109283447266, -0.8859814405441284, -0.778652012348175, -0.6713225245475769, -0.5639930367469788, -0.4566636085510254, -0.34933412075042725, -0.2420046329498291, -0.13467516005039215, -0.0273456871509552, 0.07998377084732056, 0.1873132586479187, 0.29464274644851685, 0.4019721746444702, 0.5093016624450684, 0.6166311502456665, 0.7239606380462646, 0.8312901258468628, 0.9386195540428162, 1.0459489822387695, 1.1532785892486572, 1.2606079578399658, 1.367937445640564, 1.475266933441162, 1.5825964212417603, 1.6899259090423584, 1.797255277633667, 1.9045848846435547, 2.0119142532348633, 2.119243621826172, 2.2265732288360596, 2.3339028358459473, 2.441232204437256, 2.5485618114471436, 2.655891180038452, 2.76322078704834, 2.8705501556396484, 2.977879524230957, 3.0852091312408447, 3.1925384998321533, 3.299867868423462, 3.4071974754333496, 3.514526844024658, 3.621856451034546, 3.7291858196258545, 3.836515426635742, 3.943844795227051, 4.051174163818359, 4.158503532409668, 4.265832901000977, 4.373162746429443, 4.480492115020752, 4.5878214836120605, 4.695150852203369, 4.802480697631836, 4.9098100662231445]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 11.0, 5.0, 9.0, 18.0, 18.0, 17.0, 28.0, 33.0, 24.0, 27.0, 41.0, 39.0, 60.0, 102.0, 103.0, 91.0, 52.0, 50.0, 34.0, 28.0, 28.0, 30.0, 25.0, 16.0, 22.0, 17.0, 13.0, 9.0, 11.0, 5.0, 7.0, 4.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.645404100418091, -2.5691723823547363, -2.4929404258728027, -2.4167087078094482, -2.3404769897460938, -2.26424503326416, -2.1880133152008057, -2.111781597137451, -2.0355496406555176, -1.9593178033828735, -1.8830859661102295, -1.806854248046875, -1.730622410774231, -1.654390573501587, -1.5781588554382324, -1.5019270181655884, -1.4256951808929443, -1.3494633436203003, -1.2732315063476562, -1.1969997882843018, -1.1207679510116577, -1.0445361137390137, -0.9683043360710144, -0.8920725584030151, -0.8158407211303711, -0.739608883857727, -0.6633771061897278, -0.5871453285217285, -0.5109134912490845, -0.4346816837787628, -0.35844987630844116, -0.2822180986404419, -0.20598649978637695, -0.1297546923160553, -0.05352288484573364, 0.022708922624588013, 0.09894073009490967, 0.17517253756523132, 0.251404345035553, 0.32763612270355225, 0.4038679599761963, 0.48009976744651794, 0.5563315749168396, 0.6325633525848389, 0.7087951898574829, 0.785027027130127, 0.8612588047981262, 0.9374905824661255, 1.0137224197387695, 1.0899542570114136, 1.1661860942840576, 1.242417812347412, 1.3186496496200562, 1.3948814868927002, 1.4711132049560547, 1.5473450422286987, 1.6235768795013428, 1.6998087167739868, 1.7760405540466309, 1.8522722721099854, 1.9285041093826294, 2.0047359466552734, 2.080967664718628, 2.1571993827819824, 2.233431339263916]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 4.0, 6.0, 10.0, 20.0, 12.0, 32.0, 43.0, 39.0, 112.0, 186.0, 403.0, 872.0, 2054.0, 5017.0, 14696.0, 53734.0, 295129.0, 1985511.0, 1560115.0, 216967.0, 40617.0, 11464.0, 3884.0, 1656.0, 715.0, 360.0, 197.0, 106.0, 63.0, 58.0, 31.0, 30.0, 24.0, 22.0, 14.0, 5.0, 8.0, 10.0, 11.0, 9.0, 4.0, 5.0, 2.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.1704845428466797, -0.16335678100585938, -0.15622901916503906, -0.14910125732421875, -0.14197349548339844, -0.13484573364257812, -0.1277179718017578, -0.1205902099609375, -0.11346244812011719, -0.10633468627929688, -0.09920692443847656, -0.09207916259765625, -0.08495140075683594, -0.07782363891601562, -0.07069587707519531, -0.063568115234375, -0.05644035339355469, -0.049312591552734375, -0.04218482971191406, -0.03505706787109375, -0.027929306030273438, -0.020801544189453125, -0.013673782348632812, -0.0065460205078125, 0.0005817413330078125, 0.007709503173828125, 0.014837265014648438, 0.02196502685546875, 0.029092788696289062, 0.036220550537109375, 0.04334831237792969, 0.05047607421875, 0.05760383605957031, 0.06473159790039062, 0.07185935974121094, 0.07898712158203125, 0.08611488342285156, 0.09324264526367188, 0.10037040710449219, 0.1074981689453125, 0.11462593078613281, 0.12175369262695312, 0.12888145446777344, 0.13600921630859375, 0.14313697814941406, 0.15026473999023438, 0.1573925018310547, 0.164520263671875, 0.1716480255126953, 0.17877578735351562, 0.18590354919433594, 0.19303131103515625, 0.20015907287597656, 0.20728683471679688, 0.2144145965576172, 0.2215423583984375, 0.2286701202392578, 0.23579788208007812, 0.24292564392089844, 0.25005340576171875, 0.25718116760253906, 0.2643089294433594, 0.2714366912841797, 0.278564453125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 8.0, 15.0, 19.0, 15.0, 16.0, 26.0, 34.0, 28.0, 34.0, 37.0, 37.0, 44.0, 49.0, 31.0, 53.0, 60.0, 42.0, 51.0, 51.0, 56.0, 37.0, 33.0, 43.0, 37.0, 23.0, 23.0, 24.0, 12.0, 9.0, 8.0, 3.0, 6.0, 7.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.127838134765625, -0.12286376953125, -0.117889404296875, -0.1129150390625, -0.107940673828125, -0.10296630859375, -0.097991943359375, -0.093017578125, -0.088043212890625, -0.08306884765625, -0.078094482421875, -0.0731201171875, -0.068145751953125, -0.06317138671875, -0.058197021484375, -0.05322265625, -0.048248291015625, -0.04327392578125, -0.038299560546875, -0.0333251953125, -0.028350830078125, -0.02337646484375, -0.018402099609375, -0.013427734375, -0.008453369140625, -0.00347900390625, 0.001495361328125, 0.0064697265625, 0.011444091796875, 0.01641845703125, 0.021392822265625, 0.0263671875, 0.031341552734375, 0.03631591796875, 0.041290283203125, 0.0462646484375, 0.051239013671875, 0.05621337890625, 0.061187744140625, 0.066162109375, 0.071136474609375, 0.07611083984375, 0.081085205078125, 0.0860595703125, 0.091033935546875, 0.09600830078125, 0.100982666015625, 0.10595703125, 0.110931396484375, 0.11590576171875, 0.120880126953125, 0.1258544921875, 0.130828857421875, 0.13580322265625, 0.140777587890625, 0.145751953125, 0.150726318359375, 0.15570068359375, 0.160675048828125, 0.1656494140625, 0.170623779296875, 0.17559814453125, 0.180572509765625, 0.185546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 11.0, 6.0, 12.0, 13.0, 15.0, 33.0, 39.0, 58.0, 96.0, 162.0, 300.0, 777.0, 2368.0, 10195.0, 72270.0, 1555945.0, 2433734.0, 101017.0, 12807.0, 2691.0, 852.0, 341.0, 172.0, 107.0, 58.0, 47.0, 33.0, 27.0, 18.0, 17.0, 9.0, 12.0, 6.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.443359375, -0.43071746826171875, -0.4180755615234375, -0.40543365478515625, -0.392791748046875, -0.38014984130859375, -0.3675079345703125, -0.35486602783203125, -0.34222412109375, -0.32958221435546875, -0.3169403076171875, -0.30429840087890625, -0.291656494140625, -0.27901458740234375, -0.2663726806640625, -0.25373077392578125, -0.2410888671875, -0.22844696044921875, -0.2158050537109375, -0.20316314697265625, -0.190521240234375, -0.17787933349609375, -0.1652374267578125, -0.15259552001953125, -0.13995361328125, -0.12731170654296875, -0.1146697998046875, -0.10202789306640625, -0.089385986328125, -0.07674407958984375, -0.0641021728515625, -0.05146026611328125, -0.038818359375, -0.02617645263671875, -0.0135345458984375, -0.00089263916015625, 0.011749267578125, 0.02439117431640625, 0.0370330810546875, 0.04967498779296875, 0.06231689453125, 0.07495880126953125, 0.0876007080078125, 0.10024261474609375, 0.112884521484375, 0.12552642822265625, 0.1381683349609375, 0.15081024169921875, 0.1634521484375, 0.17609405517578125, 0.1887359619140625, 0.20137786865234375, 0.214019775390625, 0.22666168212890625, 0.2393035888671875, 0.25194549560546875, 0.26458740234375, 0.27722930908203125, 0.2898712158203125, 0.30251312255859375, 0.315155029296875, 0.32779693603515625, 0.3404388427734375, 0.35308074951171875, 0.36572265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 11.0, 4.0, 10.0, 5.0, 11.0, 17.0, 19.0, 28.0, 23.0, 41.0, 55.0, 64.0, 98.0, 118.0, 160.0, 220.0, 307.0, 383.0, 507.0, 439.0, 404.0, 276.0, 207.0, 182.0, 117.0, 79.0, 65.0, 62.0, 31.0, 31.0, 21.0, 15.0, 14.0, 5.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.276123046875, -0.2682323455810547, -0.2603416442871094, -0.25245094299316406, -0.24456024169921875, -0.23666954040527344, -0.22877883911132812, -0.2208881378173828, -0.2129974365234375, -0.2051067352294922, -0.19721603393554688, -0.18932533264160156, -0.18143463134765625, -0.17354393005371094, -0.16565322875976562, -0.1577625274658203, -0.149871826171875, -0.1419811248779297, -0.13409042358398438, -0.12619972229003906, -0.11830902099609375, -0.11041831970214844, -0.10252761840820312, -0.09463691711425781, -0.0867462158203125, -0.07885551452636719, -0.07096481323242188, -0.06307411193847656, -0.05518341064453125, -0.04729270935058594, -0.039402008056640625, -0.03151130676269531, -0.02362060546875, -0.015729904174804688, -0.007839202880859375, 5.14984130859375e-05, 0.00794219970703125, 0.015832901000976562, 0.023723602294921875, 0.03161430358886719, 0.0395050048828125, 0.04739570617675781, 0.055286407470703125, 0.06317710876464844, 0.07106781005859375, 0.07895851135253906, 0.08684921264648438, 0.09473991394042969, 0.102630615234375, 0.11052131652832031, 0.11841201782226562, 0.12630271911621094, 0.13419342041015625, 0.14208412170410156, 0.14997482299804688, 0.1578655242919922, 0.1657562255859375, 0.1736469268798828, 0.18153762817382812, 0.18942832946777344, 0.19731903076171875, 0.20520973205566406, 0.21310043334960938, 0.2209911346435547, 0.2288818359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 8.0, 4.0, 16.0, 28.0, 56.0, 67.0, 87.0, 118.0, 136.0, 134.0, 115.0, 75.0, 52.0, 29.0, 20.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1091694831848145, -2.0345773696899414, -1.9599854946136475, -1.8853933811187744, -1.810801386833191, -1.7362093925476074, -1.6616172790527344, -1.5870252847671509, -1.5124332904815674, -1.4378412961959839, -1.3632493019104004, -1.2886571884155273, -1.2140651941299438, -1.1394731998443604, -1.0648810863494873, -0.9902890920639038, -0.9156970977783203, -0.8411051034927368, -0.7665130496025085, -0.6919209957122803, -0.6173290014266968, -0.5427370071411133, -0.468144953250885, -0.39355289936065674, -0.31896090507507324, -0.24436888098716736, -0.16977685689926147, -0.09518483281135559, -0.020592808723449707, 0.05399921536445618, 0.12859123945236206, 0.20318329334259033, 0.27777528762817383, 0.3523673117160797, 0.4269593358039856, 0.5015513896942139, 0.5761433839797974, 0.6507353782653809, 0.7253274321556091, 0.7999194860458374, 0.8745114803314209, 0.9491034746170044, 1.023695468902588, 1.098287582397461, 1.1728795766830444, 1.247471570968628, 1.322063684463501, 1.3966556787490845, 1.471247673034668, 1.5458396673202515, 1.620431661605835, 1.695023775100708, 1.7696157693862915, 1.844207763671875, 1.918799877166748, 1.9933918714523315, 2.067983865737915, 2.142575979232788, 2.217167854309082, 2.291759967803955, 2.366352081298828, 2.440943956375122, 2.515536069869995, 2.590127944946289, 2.664720058441162]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 4.0, 3.0, 11.0, 13.0, 17.0, 16.0, 33.0, 41.0, 28.0, 47.0, 50.0, 67.0, 49.0, 44.0, 46.0, 51.0, 52.0, 60.0, 69.0, 48.0, 48.0, 31.0, 36.0, 25.0, 24.0, 23.0, 15.0, 14.0, 4.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6510562896728516, -1.595447063446045, -1.5398379564285278, -1.4842288494110107, -1.428619623184204, -1.3730103969573975, -1.3174012899398804, -1.2617921829223633, -1.2061829566955566, -1.15057373046875, -1.094964623451233, -1.0393555164337158, -0.9837462902069092, -0.9281371235847473, -0.8725279569625854, -0.8169187903404236, -0.7613096237182617, -0.7057004570960999, -0.650091290473938, -0.5944821238517761, -0.5388729572296143, -0.4832637906074524, -0.4276546239852905, -0.37204545736312866, -0.3164362907409668, -0.26082712411880493, -0.20521795749664307, -0.1496087908744812, -0.09399962425231934, -0.03839045763015747, 0.017218708992004395, 0.07282787561416626, 0.12843692302703857, 0.18404608964920044, 0.2396552562713623, 0.29526442289352417, 0.35087358951568604, 0.4064827561378479, 0.46209192276000977, 0.5177010893821716, 0.5733102560043335, 0.6289194226264954, 0.6845285892486572, 0.7401377558708191, 0.795746922492981, 0.8513560891151428, 0.9069652557373047, 0.9625744223594666, 1.0181835889816284, 1.0737926959991455, 1.1294019222259521, 1.1850111484527588, 1.2406202554702759, 1.296229362487793, 1.3518385887145996, 1.4074478149414062, 1.4630569219589233, 1.5186660289764404, 1.574275255203247, 1.6298844814300537, 1.6854935884475708, 1.741102695465088, 1.7967119216918945, 1.8523211479187012, 1.9079302549362183]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 14.0, 13.0, 24.0, 28.0, 36.0, 59.0, 98.0, 154.0, 273.0, 502.0, 959.0, 1836.0, 4151.0, 10276.0, 28209.0, 91262.0, 354952.0, 398920.0, 104578.0, 31777.0, 11322.0, 4740.0, 2070.0, 1050.0, 496.0, 280.0, 168.0, 125.0, 67.0, 39.0, 27.0, 15.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2366943359375, -0.2288188934326172, -0.22094345092773438, -0.21306800842285156, -0.20519256591796875, -0.19731712341308594, -0.18944168090820312, -0.1815662384033203, -0.1736907958984375, -0.1658153533935547, -0.15793991088867188, -0.15006446838378906, -0.14218902587890625, -0.13431358337402344, -0.12643814086914062, -0.11856269836425781, -0.110687255859375, -0.10281181335449219, -0.09493637084960938, -0.08706092834472656, -0.07918548583984375, -0.07131004333496094, -0.06343460083007812, -0.05555915832519531, -0.0476837158203125, -0.03980827331542969, -0.031932830810546875, -0.024057388305664062, -0.01618194580078125, -0.008306503295898438, -0.000431060791015625, 0.0074443817138671875, 0.01531982421875, 0.023195266723632812, 0.031070709228515625, 0.03894615173339844, 0.04682159423828125, 0.05469703674316406, 0.06257247924804688, 0.07044792175292969, 0.0783233642578125, 0.08619880676269531, 0.09407424926757812, 0.10194969177246094, 0.10982513427734375, 0.11770057678222656, 0.12557601928710938, 0.1334514617919922, 0.141326904296875, 0.1492023468017578, 0.15707778930664062, 0.16495323181152344, 0.17282867431640625, 0.18070411682128906, 0.18857955932617188, 0.1964550018310547, 0.2043304443359375, 0.2122058868408203, 0.22008132934570312, 0.22795677185058594, 0.23583221435546875, 0.24370765686035156, 0.2515830993652344, 0.2594585418701172, 0.267333984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 6.0, 5.0, 5.0, 6.0, 6.0, 6.0, 14.0, 7.0, 22.0, 16.0, 23.0, 28.0, 27.0, 21.0, 26.0, 30.0, 41.0, 39.0, 50.0, 38.0, 31.0, 39.0, 39.0, 58.0, 55.0, 38.0, 42.0, 43.0, 34.0, 33.0, 29.0, 29.0, 18.0, 23.0, 11.0, 12.0, 9.0, 6.0, 9.0, 10.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12250709533691406, -0.11793899536132812, -0.11337089538574219, -0.10880279541015625, -0.10423469543457031, -0.09966659545898438, -0.09509849548339844, -0.0905303955078125, -0.08596229553222656, -0.08139419555664062, -0.07682609558105469, -0.07225799560546875, -0.06768989562988281, -0.06312179565429688, -0.05855369567871094, -0.053985595703125, -0.04941749572753906, -0.044849395751953125, -0.04028129577636719, -0.03571319580078125, -0.031145095825195312, -0.026576995849609375, -0.022008895874023438, -0.0174407958984375, -0.012872695922851562, -0.008304595947265625, -0.0037364959716796875, 0.00083160400390625, 0.0053997039794921875, 0.009967803955078125, 0.014535903930664062, 0.01910400390625, 0.023672103881835938, 0.028240203857421875, 0.03280830383300781, 0.03737640380859375, 0.04194450378417969, 0.046512603759765625, 0.05108070373535156, 0.0556488037109375, 0.06021690368652344, 0.06478500366210938, 0.06935310363769531, 0.07392120361328125, 0.07848930358886719, 0.08305740356445312, 0.08762550354003906, 0.092193603515625, 0.09676170349121094, 0.10132980346679688, 0.10589790344238281, 0.11046600341796875, 0.11503410339355469, 0.11960220336914062, 0.12417030334472656, 0.1287384033203125, 0.13330650329589844, 0.13787460327148438, 0.1424427032470703, 0.14701080322265625, 0.1515789031982422, 0.15614700317382812, 0.16071510314941406, 0.165283203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 7.0, 14.0, 18.0, 27.0, 46.0, 69.0, 96.0, 136.0, 224.0, 366.0, 629.0, 1295.0, 3302.0, 11767.0, 74097.0, 798402.0, 132942.0, 17000.0, 4407.0, 1621.0, 751.0, 476.0, 280.0, 172.0, 126.0, 85.0, 47.0, 25.0, 19.0, 20.0, 15.0, 11.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.45751953125, -0.4439125061035156, -0.43030548095703125, -0.4166984558105469, -0.4030914306640625, -0.3894844055175781, -0.37587738037109375, -0.3622703552246094, -0.348663330078125, -0.3350563049316406, -0.32144927978515625, -0.3078422546386719, -0.2942352294921875, -0.2806282043457031, -0.26702117919921875, -0.2534141540527344, -0.23980712890625, -0.22620010375976562, -0.21259307861328125, -0.19898605346679688, -0.1853790283203125, -0.17177200317382812, -0.15816497802734375, -0.14455795288085938, -0.130950927734375, -0.11734390258789062, -0.10373687744140625, -0.09012985229492188, -0.0765228271484375, -0.06291580200195312, -0.04930877685546875, -0.035701751708984375, -0.0220947265625, -0.008487701416015625, 0.00511932373046875, 0.018726348876953125, 0.0323333740234375, 0.045940399169921875, 0.05954742431640625, 0.07315444946289062, 0.086761474609375, 0.10036849975585938, 0.11397552490234375, 0.12758255004882812, 0.1411895751953125, 0.15479660034179688, 0.16840362548828125, 0.18201065063476562, 0.19561767578125, 0.20922470092773438, 0.22283172607421875, 0.23643875122070312, 0.2500457763671875, 0.2636528015136719, 0.27725982666015625, 0.2908668518066406, 0.304473876953125, 0.3180809020996094, 0.33168792724609375, 0.3452949523925781, 0.3589019775390625, 0.3725090026855469, 0.38611602783203125, 0.3997230529785156, 0.413330078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 1.0, 7.0, 13.0, 23.0, 16.0, 12.0, 20.0, 28.0, 31.0, 33.0, 36.0, 49.0, 36.0, 55.0, 60.0, 62.0, 51.0, 59.0, 56.0, 46.0, 42.0, 28.0, 47.0, 31.0, 28.0, 31.0, 22.0, 8.0, 10.0, 11.0, 7.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.7158203125, -0.6964263916015625, -0.677032470703125, -0.6576385498046875, -0.63824462890625, -0.6188507080078125, -0.599456787109375, -0.5800628662109375, -0.5606689453125, -0.5412750244140625, -0.521881103515625, -0.5024871826171875, -0.48309326171875, -0.4636993408203125, -0.444305419921875, -0.4249114990234375, -0.405517578125, -0.3861236572265625, -0.366729736328125, -0.3473358154296875, -0.32794189453125, -0.3085479736328125, -0.289154052734375, -0.2697601318359375, -0.2503662109375, -0.2309722900390625, -0.211578369140625, -0.1921844482421875, -0.17279052734375, -0.1533966064453125, -0.134002685546875, -0.1146087646484375, -0.09521484375, -0.0758209228515625, -0.056427001953125, -0.0370330810546875, -0.01763916015625, 0.0017547607421875, 0.021148681640625, 0.0405426025390625, 0.0599365234375, 0.0793304443359375, 0.098724365234375, 0.1181182861328125, 0.13751220703125, 0.1569061279296875, 0.176300048828125, 0.1956939697265625, 0.215087890625, 0.2344818115234375, 0.253875732421875, 0.2732696533203125, 0.29266357421875, 0.3120574951171875, 0.331451416015625, 0.3508453369140625, 0.3702392578125, 0.3896331787109375, 0.409027099609375, 0.4284210205078125, 0.44781494140625, 0.4672088623046875, 0.486602783203125, 0.5059967041015625, 0.525390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 20.0, 17.0, 36.0, 52.0, 86.0, 128.0, 227.0, 408.0, 773.0, 1749.0, 4377.0, 12799.0, 48759.0, 425663.0, 483622.0, 49158.0, 12777.0, 4318.0, 1709.0, 840.0, 421.0, 213.0, 138.0, 73.0, 47.0, 35.0, 25.0, 12.0, 13.0, 8.0, 8.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09899520874023438, -0.09569549560546875, -0.09239578247070312, -0.0890960693359375, -0.08579635620117188, -0.08249664306640625, -0.07919692993164062, -0.075897216796875, -0.07259750366210938, -0.06929779052734375, -0.06599807739257812, -0.0626983642578125, -0.059398651123046875, -0.05609893798828125, -0.052799224853515625, -0.04949951171875, -0.046199798583984375, -0.04290008544921875, -0.039600372314453125, -0.0363006591796875, -0.033000946044921875, -0.02970123291015625, -0.026401519775390625, -0.023101806640625, -0.019802093505859375, -0.01650238037109375, -0.013202667236328125, -0.0099029541015625, -0.006603240966796875, -0.00330352783203125, -3.814697265625e-06, 0.0032958984375, 0.006595611572265625, 0.00989532470703125, 0.013195037841796875, 0.0164947509765625, 0.019794464111328125, 0.02309417724609375, 0.026393890380859375, 0.029693603515625, 0.032993316650390625, 0.03629302978515625, 0.039592742919921875, 0.0428924560546875, 0.046192169189453125, 0.04949188232421875, 0.052791595458984375, 0.05609130859375, 0.059391021728515625, 0.06269073486328125, 0.06599044799804688, 0.0692901611328125, 0.07258987426757812, 0.07588958740234375, 0.07918930053710938, 0.082489013671875, 0.08578872680664062, 0.08908843994140625, 0.09238815307617188, 0.0956878662109375, 0.09898757934570312, 0.10228729248046875, 0.10558700561523438, 0.10888671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 15.0, 19.0, 28.0, 42.0, 84.0, 115.0, 138.0, 125.0, 113.0, 88.0, 63.0, 45.0, 31.0, 21.0, 11.0, 10.0, 4.0, 3.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84721565246582e-05, -5.65405935049057e-05, -5.46090304851532e-05, -5.2677467465400696e-05, -5.074590444564819e-05, -4.881434142589569e-05, -4.688277840614319e-05, -4.4951215386390686e-05, -4.3019652366638184e-05, -4.108808934688568e-05, -3.915652632713318e-05, -3.7224963307380676e-05, -3.5293400287628174e-05, -3.336183726787567e-05, -3.143027424812317e-05, -2.9498711228370667e-05, -2.7567148208618164e-05, -2.563558518886566e-05, -2.370402216911316e-05, -2.1772459149360657e-05, -1.9840896129608154e-05, -1.7909333109855652e-05, -1.597777009010315e-05, -1.4046207070350647e-05, -1.2114644050598145e-05, -1.0183081030845642e-05, -8.25151801109314e-06, -6.319954991340637e-06, -4.388391971588135e-06, -2.4568289518356323e-06, -5.252659320831299e-07, 1.4062970876693726e-06, 3.337860107421875e-06, 5.2694231271743774e-06, 7.20098614692688e-06, 9.132549166679382e-06, 1.1064112186431885e-05, 1.2995675206184387e-05, 1.492723822593689e-05, 1.6858801245689392e-05, 1.8790364265441895e-05, 2.0721927285194397e-05, 2.26534903049469e-05, 2.4585053324699402e-05, 2.6516616344451904e-05, 2.8448179364204407e-05, 3.037974238395691e-05, 3.231130540370941e-05, 3.4242868423461914e-05, 3.6174431443214417e-05, 3.810599446296692e-05, 4.003755748271942e-05, 4.1969120502471924e-05, 4.3900683522224426e-05, 4.583224654197693e-05, 4.776380956172943e-05, 4.9695372581481934e-05, 5.1626935601234436e-05, 5.355849862098694e-05, 5.549006164073944e-05, 5.742162466049194e-05, 5.9353187680244446e-05, 6.128475069999695e-05, 6.321631371974945e-05, 6.514787673950195e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 12.0, 14.0, 22.0, 54.0, 66.0, 118.0, 184.0, 304.0, 531.0, 1027.0, 2111.0, 5439.0, 16579.0, 62500.0, 585472.0, 296190.0, 54146.0, 14740.0, 4765.0, 1953.0, 987.0, 552.0, 277.0, 218.0, 113.0, 64.0, 37.0, 29.0, 9.0, 11.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.09749698638916016, -0.09434700012207031, -0.09119701385498047, -0.08804702758789062, -0.08489704132080078, -0.08174705505371094, -0.0785970687866211, -0.07544708251953125, -0.0722970962524414, -0.06914710998535156, -0.06599712371826172, -0.06284713745117188, -0.05969715118408203, -0.05654716491699219, -0.053397178649902344, -0.0502471923828125, -0.047097206115722656, -0.04394721984863281, -0.04079723358154297, -0.037647247314453125, -0.03449726104736328, -0.03134727478027344, -0.028197288513183594, -0.02504730224609375, -0.021897315979003906, -0.018747329711914062, -0.015597343444824219, -0.012447357177734375, -0.009297370910644531, -0.0061473846435546875, -0.0029973983764648438, 0.000152587890625, 0.0033025741577148438, 0.0064525604248046875, 0.009602546691894531, 0.012752532958984375, 0.01590251922607422, 0.019052505493164062, 0.022202491760253906, 0.02535247802734375, 0.028502464294433594, 0.03165245056152344, 0.03480243682861328, 0.037952423095703125, 0.04110240936279297, 0.04425239562988281, 0.047402381896972656, 0.0505523681640625, 0.053702354431152344, 0.05685234069824219, 0.06000232696533203, 0.06315231323242188, 0.06630229949951172, 0.06945228576660156, 0.0726022720336914, 0.07575225830078125, 0.0789022445678711, 0.08205223083496094, 0.08520221710205078, 0.08835220336914062, 0.09150218963623047, 0.09465217590332031, 0.09780216217041016, 0.1009521484375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 8.0, 9.0, 6.0, 6.0, 8.0, 19.0, 13.0, 24.0, 24.0, 24.0, 37.0, 54.0, 71.0, 100.0, 104.0, 87.0, 95.0, 65.0, 47.0, 52.0, 30.0, 21.0, 21.0, 20.0, 11.0, 8.0, 7.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.09174251556396484, -0.08845329284667969, -0.08516407012939453, -0.08187484741210938, -0.07858562469482422, -0.07529640197753906, -0.0720071792602539, -0.06871795654296875, -0.0654287338256836, -0.06213951110839844, -0.05885028839111328, -0.055561065673828125, -0.05227184295654297, -0.04898262023925781, -0.045693397521972656, -0.0424041748046875, -0.039114952087402344, -0.03582572937011719, -0.03253650665283203, -0.029247283935546875, -0.02595806121826172, -0.022668838500976562, -0.019379615783691406, -0.01609039306640625, -0.012801170349121094, -0.009511947631835938, -0.006222724914550781, -0.002933502197265625, 0.00035572052001953125, 0.0036449432373046875, 0.006934165954589844, 0.010223388671875, 0.013512611389160156, 0.016801834106445312, 0.02009105682373047, 0.023380279541015625, 0.02666950225830078, 0.029958724975585938, 0.033247947692871094, 0.03653717041015625, 0.039826393127441406, 0.04311561584472656, 0.04640483856201172, 0.049694061279296875, 0.05298328399658203, 0.05627250671386719, 0.059561729431152344, 0.0628509521484375, 0.06614017486572266, 0.06942939758300781, 0.07271862030029297, 0.07600784301757812, 0.07929706573486328, 0.08258628845214844, 0.0858755111694336, 0.08916473388671875, 0.0924539566040039, 0.09574317932128906, 0.09903240203857422, 0.10232162475585938, 0.10561084747314453, 0.10890007019042969, 0.11218929290771484, 0.115478515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 14.0, 24.0, 49.0, 84.0, 184.0, 397.0, 136.0, 44.0, 33.0, 14.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.743709087371826, -5.617029190063477, -5.490349292755127, -5.363669395446777, -5.236989498138428, -5.110309600830078, -4.9836297035217285, -4.856949806213379, -4.730269432067871, -4.6035895347595215, -4.476909637451172, -4.350229740142822, -4.223549842834473, -4.096869945526123, -3.9701898097991943, -3.8435099124908447, -3.716830253601074, -3.5901503562927246, -3.463470458984375, -3.3367905616760254, -3.210110664367676, -3.083430767059326, -2.9567506313323975, -2.830070734024048, -2.7033908367156982, -2.5767109394073486, -2.450031042098999, -2.3233511447906494, -2.1966710090637207, -2.069991111755371, -1.9433112144470215, -1.8166313171386719, -1.6899516582489014, -1.5632717609405518, -1.4365918636322021, -1.309911847114563, -1.1832319498062134, -1.0565520524978638, -0.9298720955848694, -0.803192138671875, -0.6765122413635254, -0.5498323440551758, -0.4231523871421814, -0.2964724600315094, -0.1697925329208374, -0.04311263561248779, 0.08356732130050659, 0.21024727821350098, 0.3369271755218506, 0.4636071026325226, 0.5902870297431946, 0.716966986656189, 0.8436468839645386, 0.9703267812728882, 1.0970067977905273, 1.223686695098877, 1.3503665924072266, 1.4770464897155762, 1.6037263870239258, 1.730406403541565, 1.8570863008499146, 1.9837661981582642, 2.1104462146759033, 2.237126111984253, 2.3638060092926025]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 7.0, 11.0, 12.0, 8.0, 13.0, 14.0, 22.0, 23.0, 28.0, 31.0, 25.0, 33.0, 28.0, 45.0, 96.0, 132.0, 123.0, 56.0, 43.0, 28.0, 35.0, 33.0, 34.0, 16.0, 23.0, 17.0, 8.0, 10.0, 10.0, 4.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.7638497352600098, -2.688305377960205, -2.6127607822418213, -2.5372164249420166, -2.461671829223633, -2.386127471923828, -2.3105831146240234, -2.2350385189056396, -2.159494161605835, -2.0839498043060303, -2.0084052085876465, -1.9328608512878418, -1.8573163747787476, -1.7817718982696533, -1.706227421760559, -1.6306829452514648, -1.5551384687423706, -1.4795939922332764, -1.4040495157241821, -1.328505039215088, -1.2529606819152832, -1.177416205406189, -1.1018717288970947, -1.02632737159729, -0.950782835483551, -0.8752383589744568, -0.7996939420700073, -0.7241494655609131, -0.6486049890518188, -0.5730605721473694, -0.49751609563827515, -0.4219716787338257, -0.34642720222473145, -0.2708827555179596, -0.19533829391002655, -0.1197938323020935, -0.044249385595321655, 0.031295061111450195, 0.10683953762054443, 0.1823839545249939, 0.25792843103408813, 0.33347287774086, 0.40901732444763184, 0.4845618009567261, 0.5601062774658203, 0.6356506943702698, 0.711195170879364, 0.7867395877838135, 0.8622840642929077, 0.937828540802002, 1.0133730173110962, 1.0889174938201904, 1.1644618511199951, 1.2400063276290894, 1.3155508041381836, 1.3910951614379883, 1.466639757156372, 1.5421842336654663, 1.6177287101745605, 1.6932730674743652, 1.7688175439834595, 1.8443620204925537, 1.919906497001648, 1.9954509735107422, 2.070995330810547]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 3.0, 5.0, 11.0, 12.0, 6.0, 12.0, 9.0, 26.0, 22.0, 41.0, 42.0, 58.0, 83.0, 170.0, 222.0, 395.0, 752.0, 1396.0, 2923.0, 7093.0, 20880.0, 74194.0, 356379.0, 1698814.0, 1597046.0, 332861.0, 69171.0, 19093.0, 6820.0, 2717.0, 1316.0, 672.0, 366.0, 233.0, 114.0, 99.0, 50.0, 42.0, 23.0, 21.0, 18.0, 14.0, 16.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.344482421875, -0.33490753173828125, -0.3253326416015625, -0.31575775146484375, -0.306182861328125, -0.29660797119140625, -0.2870330810546875, -0.27745819091796875, -0.26788330078125, -0.25830841064453125, -0.2487335205078125, -0.23915863037109375, -0.229583740234375, -0.22000885009765625, -0.2104339599609375, -0.20085906982421875, -0.1912841796875, -0.18170928955078125, -0.1721343994140625, -0.16255950927734375, -0.152984619140625, -0.14340972900390625, -0.1338348388671875, -0.12425994873046875, -0.11468505859375, -0.10511016845703125, -0.0955352783203125, -0.08596038818359375, -0.076385498046875, -0.06681060791015625, -0.0572357177734375, -0.04766082763671875, -0.0380859375, -0.02851104736328125, -0.0189361572265625, -0.00936126708984375, 0.000213623046875, 0.00978851318359375, 0.0193634033203125, 0.02893829345703125, 0.03851318359375, 0.04808807373046875, 0.0576629638671875, 0.06723785400390625, 0.076812744140625, 0.08638763427734375, 0.0959625244140625, 0.10553741455078125, 0.1151123046875, 0.12468719482421875, 0.1342620849609375, 0.14383697509765625, 0.153411865234375, 0.16298675537109375, 0.1725616455078125, 0.18213653564453125, 0.19171142578125, 0.20128631591796875, 0.2108612060546875, 0.22043609619140625, 0.230010986328125, 0.23958587646484375, 0.2491607666015625, 0.25873565673828125, 0.268310546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 6.0, 9.0, 9.0, 9.0, 17.0, 14.0, 16.0, 20.0, 33.0, 32.0, 31.0, 27.0, 35.0, 41.0, 37.0, 47.0, 39.0, 41.0, 53.0, 46.0, 48.0, 37.0, 31.0, 49.0, 43.0, 36.0, 39.0, 33.0, 23.0, 20.0, 16.0, 10.0, 7.0, 9.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.132568359375, -0.1278705596923828, -0.12317276000976562, -0.11847496032714844, -0.11377716064453125, -0.10907936096191406, -0.10438156127929688, -0.09968376159667969, -0.0949859619140625, -0.09028816223144531, -0.08559036254882812, -0.08089256286621094, -0.07619476318359375, -0.07149696350097656, -0.06679916381835938, -0.06210136413574219, -0.057403564453125, -0.05270576477050781, -0.048007965087890625, -0.04331016540527344, -0.03861236572265625, -0.03391456604003906, -0.029216766357421875, -0.024518966674804688, -0.0198211669921875, -0.015123367309570312, -0.010425567626953125, -0.0057277679443359375, -0.00102996826171875, 0.0036678314208984375, 0.008365631103515625, 0.013063430786132812, 0.01776123046875, 0.022459030151367188, 0.027156829833984375, 0.03185462951660156, 0.03655242919921875, 0.04125022888183594, 0.045948028564453125, 0.05064582824707031, 0.0553436279296875, 0.06004142761230469, 0.06473922729492188, 0.06943702697753906, 0.07413482666015625, 0.07883262634277344, 0.08353042602539062, 0.08822822570800781, 0.092926025390625, 0.09762382507324219, 0.10232162475585938, 0.10701942443847656, 0.11171722412109375, 0.11641502380371094, 0.12111282348632812, 0.1258106231689453, 0.1305084228515625, 0.1352062225341797, 0.13990402221679688, 0.14460182189941406, 0.14929962158203125, 0.15399742126464844, 0.15869522094726562, 0.1633930206298828, 0.1680908203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 16.0, 23.0, 28.0, 59.0, 74.0, 178.0, 375.0, 791.0, 2402.0, 21277.0, 3996459.0, 165708.0, 4704.0, 1216.0, 465.0, 227.0, 104.0, 80.0, 24.0, 16.0, 7.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4765625, -1.4268646240234375, -1.377166748046875, -1.3274688720703125, -1.27777099609375, -1.2280731201171875, -1.178375244140625, -1.1286773681640625, -1.0789794921875, -1.0292816162109375, -0.979583740234375, -0.9298858642578125, -0.88018798828125, -0.8304901123046875, -0.780792236328125, -0.7310943603515625, -0.681396484375, -0.6316986083984375, -0.582000732421875, -0.5323028564453125, -0.48260498046875, -0.4329071044921875, -0.383209228515625, -0.3335113525390625, -0.2838134765625, -0.2341156005859375, -0.184417724609375, -0.1347198486328125, -0.08502197265625, -0.0353240966796875, 0.014373779296875, 0.0640716552734375, 0.11376953125, 0.1634674072265625, 0.213165283203125, 0.2628631591796875, 0.31256103515625, 0.3622589111328125, 0.411956787109375, 0.4616546630859375, 0.5113525390625, 0.5610504150390625, 0.610748291015625, 0.6604461669921875, 0.71014404296875, 0.7598419189453125, 0.809539794921875, 0.8592376708984375, 0.908935546875, 0.9586334228515625, 1.008331298828125, 1.0580291748046875, 1.10772705078125, 1.1574249267578125, 1.207122802734375, 1.2568206787109375, 1.3065185546875, 1.3562164306640625, 1.405914306640625, 1.4556121826171875, 1.50531005859375, 1.5550079345703125, 1.604705810546875, 1.6544036865234375, 1.7041015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 6.0, 12.0, 17.0, 30.0, 59.0, 121.0, 180.0, 368.0, 626.0, 867.0, 799.0, 439.0, 244.0, 145.0, 81.0, 40.0, 20.0, 16.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0622177124023438, -1.0316619873046875, -1.0011062622070312, -0.970550537109375, -0.9399948120117188, -0.9094390869140625, -0.8788833618164062, -0.84832763671875, -0.8177719116210938, -0.7872161865234375, -0.7566604614257812, -0.726104736328125, -0.6955490112304688, -0.6649932861328125, -0.6344375610351562, -0.6038818359375, -0.5733261108398438, -0.5427703857421875, -0.5122146606445312, -0.481658935546875, -0.45110321044921875, -0.4205474853515625, -0.38999176025390625, -0.35943603515625, -0.32888031005859375, -0.2983245849609375, -0.26776885986328125, -0.237213134765625, -0.20665740966796875, -0.1761016845703125, -0.14554595947265625, -0.114990234375, -0.08443450927734375, -0.0538787841796875, -0.02332305908203125, 0.007232666015625, 0.03778839111328125, 0.0683441162109375, 0.09889984130859375, 0.12945556640625, 0.16001129150390625, 0.1905670166015625, 0.22112274169921875, 0.251678466796875, 0.28223419189453125, 0.3127899169921875, 0.34334564208984375, 0.3739013671875, 0.40445709228515625, 0.4350128173828125, 0.46556854248046875, 0.496124267578125, 0.5266799926757812, 0.5572357177734375, 0.5877914428710938, 0.61834716796875, 0.6489028930664062, 0.6794586181640625, 0.7100143432617188, 0.740570068359375, 0.7711257934570312, 0.8016815185546875, 0.8322372436523438, 0.86279296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 20.0, 34.0, 61.0, 133.0, 219.0, 245.0, 133.0, 71.0, 24.0, 20.0, 13.0, 2.0, 1.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.410016059875488, -6.1209869384765625, -5.831958293914795, -5.542929172515869, -5.253900527954102, -4.964871406555176, -4.67584228515625, -4.386813163757324, -4.097784519195557, -3.80875563621521, -3.5197267532348633, -3.2306976318359375, -2.941668748855591, -2.652639865875244, -2.3636107444763184, -2.0745818614959717, -1.785552978515625, -1.4965240955352783, -1.207495093345642, -0.9184661507606506, -0.6294372081756592, -0.3404083251953125, -0.05137932300567627, 0.23764967918395996, 0.5266785621643066, 0.8157075047492981, 1.1047364473342896, 1.3937654495239258, 1.6827943325042725, 1.9718232154846191, 2.260852336883545, 2.5498812198638916, 2.8389110565185547, 3.1279399394989014, 3.416968822479248, 3.705997943878174, 3.9950268268585205, 4.284055709838867, 4.573084831237793, 4.862113952636719, 5.151142597198486, 5.440171718597412, 5.72920036315918, 6.0182294845581055, 6.307258605957031, 6.596287250518799, 6.885316371917725, 7.174345016479492, 7.463374137878418, 7.752403259277344, 8.04143238067627, 8.330460548400879, 8.619489669799805, 8.90851879119873, 9.197547912597656, 9.486577033996582, 9.775606155395508, 10.064635276794434, 10.35366439819336, 10.642692565917969, 10.931721687316895, 11.22075080871582, 11.509779930114746, 11.798809051513672, 12.087837219238281]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 3.0, 7.0, 9.0, 4.0, 14.0, 17.0, 14.0, 22.0, 17.0, 25.0, 28.0, 28.0, 22.0, 30.0, 33.0, 48.0, 41.0, 47.0, 47.0, 56.0, 53.0, 41.0, 35.0, 40.0, 39.0, 35.0, 33.0, 17.0, 28.0, 22.0, 24.0, 15.0, 23.0, 17.0, 10.0, 10.0, 14.0, 5.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.464331865310669, -2.3768444061279297, -2.2893569469451904, -2.201869487762451, -2.114382028579712, -2.0268945693969727, -1.9394069910049438, -1.8519195318222046, -1.7644320726394653, -1.676944613456726, -1.5894571542739868, -1.501969575881958, -1.4144821166992188, -1.3269946575164795, -1.2395071983337402, -1.152019739151001, -1.0645322799682617, -0.9770448207855225, -0.8895573616027832, -0.8020698428153992, -0.7145823836326599, -0.6270949244499207, -0.5396074056625366, -0.45211994647979736, -0.3646324872970581, -0.27714502811431885, -0.1896575391292572, -0.10217005014419556, -0.014682590961456299, 0.07280486822128296, 0.160292387008667, 0.24777984619140625, 0.3352675437927246, 0.42275500297546387, 0.5102424621582031, 0.5977299809455872, 0.6852174401283264, 0.7727048993110657, 0.8601924180984497, 0.947679877281189, 1.0351673364639282, 1.1226547956466675, 1.2101422548294067, 1.2976298332214355, 1.3851172924041748, 1.472604751586914, 1.5600922107696533, 1.6475796699523926, 1.7350671291351318, 1.822554588317871, 1.9100420475006104, 1.9975295066833496, 2.085016965866089, 2.172504425048828, 2.2599921226501465, 2.3474793434143066, 2.434967041015625, 2.5224545001983643, 2.6099419593811035, 2.6974294185638428, 2.784916877746582, 2.8724043369293213, 2.9598917961120605, 3.047379493713379, 3.134866714477539]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 5.0, 9.0, 10.0, 12.0, 27.0, 32.0, 55.0, 72.0, 115.0, 165.0, 263.0, 434.0, 694.0, 1090.0, 1889.0, 3451.0, 6634.0, 13385.0, 32593.0, 92773.0, 378092.0, 366202.0, 90311.0, 31982.0, 13583.0, 6434.0, 3361.0, 1946.0, 1103.0, 653.0, 389.0, 245.0, 194.0, 117.0, 63.0, 56.0, 33.0, 33.0, 10.0, 9.0, 7.0, 7.0, 2.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.222900390625, -0.21570777893066406, -0.20851516723632812, -0.2013225555419922, -0.19412994384765625, -0.1869373321533203, -0.17974472045898438, -0.17255210876464844, -0.1653594970703125, -0.15816688537597656, -0.15097427368164062, -0.1437816619873047, -0.13658905029296875, -0.1293964385986328, -0.12220382690429688, -0.11501121520996094, -0.107818603515625, -0.10062599182128906, -0.09343338012695312, -0.08624076843261719, -0.07904815673828125, -0.07185554504394531, -0.06466293334960938, -0.05747032165527344, -0.0502777099609375, -0.04308509826660156, -0.035892486572265625, -0.028699874877929688, -0.02150726318359375, -0.014314651489257812, -0.007122039794921875, 7.05718994140625e-05, 0.00726318359375, 0.014455795288085938, 0.021648406982421875, 0.028841018676757812, 0.03603363037109375, 0.04322624206542969, 0.050418853759765625, 0.05761146545410156, 0.0648040771484375, 0.07199668884277344, 0.07918930053710938, 0.08638191223144531, 0.09357452392578125, 0.10076713562011719, 0.10795974731445312, 0.11515235900878906, 0.122344970703125, 0.12953758239746094, 0.13673019409179688, 0.1439228057861328, 0.15111541748046875, 0.1583080291748047, 0.16550064086914062, 0.17269325256347656, 0.1798858642578125, 0.18707847595214844, 0.19427108764648438, 0.2014636993408203, 0.20865631103515625, 0.2158489227294922, 0.22304153442382812, 0.23023414611816406, 0.2374267578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 16.0, 12.0, 17.0, 15.0, 24.0, 33.0, 29.0, 37.0, 49.0, 61.0, 70.0, 56.0, 39.0, 49.0, 55.0, 59.0, 58.0, 40.0, 39.0, 40.0, 39.0, 34.0, 16.0, 20.0, 20.0, 21.0, 9.0, 7.0, 8.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.21088027954101562, -0.20227813720703125, -0.19367599487304688, -0.1850738525390625, -0.17647171020507812, -0.16786956787109375, -0.15926742553710938, -0.150665283203125, -0.14206314086914062, -0.13346099853515625, -0.12485885620117188, -0.1162567138671875, -0.10765457153320312, -0.09905242919921875, -0.09045028686523438, -0.08184814453125, -0.07324600219726562, -0.06464385986328125, -0.056041717529296875, -0.0474395751953125, -0.038837432861328125, -0.03023529052734375, -0.021633148193359375, -0.013031005859375, -0.004428863525390625, 0.00417327880859375, 0.012775421142578125, 0.0213775634765625, 0.029979705810546875, 0.03858184814453125, 0.047183990478515625, 0.0557861328125, 0.06438827514648438, 0.07299041748046875, 0.08159255981445312, 0.0901947021484375, 0.09879684448242188, 0.10739898681640625, 0.11600112915039062, 0.124603271484375, 0.13320541381835938, 0.14180755615234375, 0.15040969848632812, 0.1590118408203125, 0.16761398315429688, 0.17621612548828125, 0.18481826782226562, 0.19342041015625, 0.20202255249023438, 0.21062469482421875, 0.21922683715820312, 0.2278289794921875, 0.23643112182617188, 0.24503326416015625, 0.2536354064941406, 0.262237548828125, 0.2708396911621094, 0.27944183349609375, 0.2880439758300781, 0.2966461181640625, 0.3052482604980469, 0.31385040283203125, 0.3224525451660156, 0.3310546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 2.0, 7.0, 9.0, 6.0, 24.0, 32.0, 47.0, 85.0, 160.0, 374.0, 971.0, 4140.0, 44484.0, 951071.0, 41410.0, 3970.0, 982.0, 362.0, 165.0, 101.0, 62.0, 28.0, 17.0, 12.0, 12.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6521377563476562, -0.6314239501953125, -0.6107101440429688, -0.589996337890625, -0.5692825317382812, -0.5485687255859375, -0.5278549194335938, -0.50714111328125, -0.48642730712890625, -0.4657135009765625, -0.44499969482421875, -0.424285888671875, -0.40357208251953125, -0.3828582763671875, -0.36214447021484375, -0.3414306640625, -0.32071685791015625, -0.3000030517578125, -0.27928924560546875, -0.258575439453125, -0.23786163330078125, -0.2171478271484375, -0.19643402099609375, -0.17572021484375, -0.15500640869140625, -0.1342926025390625, -0.11357879638671875, -0.092864990234375, -0.07215118408203125, -0.0514373779296875, -0.03072357177734375, -0.010009765625, 0.01070404052734375, 0.0314178466796875, 0.05213165283203125, 0.072845458984375, 0.09355926513671875, 0.1142730712890625, 0.13498687744140625, 0.15570068359375, 0.17641448974609375, 0.1971282958984375, 0.21784210205078125, 0.238555908203125, 0.25926971435546875, 0.2799835205078125, 0.30069732666015625, 0.3214111328125, 0.34212493896484375, 0.3628387451171875, 0.38355255126953125, 0.404266357421875, 0.42498016357421875, 0.4456939697265625, 0.46640777587890625, 0.48712158203125, 0.5078353881835938, 0.5285491943359375, 0.5492630004882812, 0.569976806640625, 0.5906906127929688, 0.6114044189453125, 0.6321182250976562, 0.65283203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 12.0, 13.0, 10.0, 13.0, 22.0, 23.0, 24.0, 48.0, 44.0, 65.0, 70.0, 106.0, 86.0, 72.0, 78.0, 45.0, 42.0, 35.0, 30.0, 27.0, 27.0, 19.0, 10.0, 13.0, 11.0, 9.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2373046875, -1.2040176391601562, -1.1707305908203125, -1.1374435424804688, -1.104156494140625, -1.0708694458007812, -1.0375823974609375, -1.0042953491210938, -0.97100830078125, -0.9377212524414062, -0.9044342041015625, -0.8711471557617188, -0.837860107421875, -0.8045730590820312, -0.7712860107421875, -0.7379989624023438, -0.7047119140625, -0.6714248657226562, -0.6381378173828125, -0.6048507690429688, -0.571563720703125, -0.5382766723632812, -0.5049896240234375, -0.47170257568359375, -0.43841552734375, -0.40512847900390625, -0.3718414306640625, -0.33855438232421875, -0.305267333984375, -0.27198028564453125, -0.2386932373046875, -0.20540618896484375, -0.172119140625, -0.13883209228515625, -0.1055450439453125, -0.07225799560546875, -0.038970947265625, -0.00568389892578125, 0.0276031494140625, 0.06089019775390625, 0.09417724609375, 0.12746429443359375, 0.1607513427734375, 0.19403839111328125, 0.227325439453125, 0.26061248779296875, 0.2938995361328125, 0.32718658447265625, 0.3604736328125, 0.39376068115234375, 0.4270477294921875, 0.46033477783203125, 0.493621826171875, 0.5269088745117188, 0.5601959228515625, 0.5934829711914062, 0.62677001953125, 0.6600570678710938, 0.6933441162109375, 0.7266311645507812, 0.759918212890625, 0.7932052612304688, 0.8264923095703125, 0.8597793579101562, 0.89306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 10.0, 17.0, 21.0, 38.0, 42.0, 72.0, 120.0, 210.0, 409.0, 1003.0, 3074.0, 13674.0, 138764.0, 854233.0, 28873.0, 5202.0, 1471.0, 588.0, 260.0, 153.0, 94.0, 56.0, 45.0, 36.0, 18.0, 19.0, 12.0, 9.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09600830078125, -0.09260272979736328, -0.08919715881347656, -0.08579158782958984, -0.08238601684570312, -0.0789804458618164, -0.07557487487792969, -0.07216930389404297, -0.06876373291015625, -0.06535816192626953, -0.06195259094238281, -0.058547019958496094, -0.055141448974609375, -0.051735877990722656, -0.04833030700683594, -0.04492473602294922, -0.0415191650390625, -0.03811359405517578, -0.03470802307128906, -0.031302452087402344, -0.027896881103515625, -0.024491310119628906, -0.021085739135742188, -0.01768016815185547, -0.01427459716796875, -0.010869026184082031, -0.0074634552001953125, -0.004057884216308594, -0.000652313232421875, 0.0027532577514648438, 0.0061588287353515625, 0.009564399719238281, 0.012969970703125, 0.01637554168701172, 0.019781112670898438, 0.023186683654785156, 0.026592254638671875, 0.029997825622558594, 0.03340339660644531, 0.03680896759033203, 0.04021453857421875, 0.04362010955810547, 0.04702568054199219, 0.050431251525878906, 0.053836822509765625, 0.057242393493652344, 0.06064796447753906, 0.06405353546142578, 0.0674591064453125, 0.07086467742919922, 0.07427024841308594, 0.07767581939697266, 0.08108139038085938, 0.0844869613647461, 0.08789253234863281, 0.09129810333251953, 0.09470367431640625, 0.09810924530029297, 0.10151481628417969, 0.1049203872680664, 0.10832595825195312, 0.11173152923583984, 0.11513710021972656, 0.11854267120361328, 0.1219482421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 14.0, 6.0, 12.0, 12.0, 13.0, 15.0, 16.0, 15.0, 24.0, 33.0, 44.0, 48.0, 64.0, 64.0, 75.0, 74.0, 85.0, 53.0, 53.0, 48.0, 33.0, 33.0, 26.0, 24.0, 15.0, 15.0, 12.0, 8.0, 9.0, 6.0, 11.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0994415283203125e-05, -2.9935501515865326e-05, -2.8876587748527527e-05, -2.7817673981189728e-05, -2.675876021385193e-05, -2.569984644651413e-05, -2.464093267917633e-05, -2.358201891183853e-05, -2.2523105144500732e-05, -2.1464191377162933e-05, -2.0405277609825134e-05, -1.9346363842487335e-05, -1.8287450075149536e-05, -1.7228536307811737e-05, -1.6169622540473938e-05, -1.5110708773136139e-05, -1.405179500579834e-05, -1.299288123846054e-05, -1.1933967471122742e-05, -1.0875053703784943e-05, -9.816139936447144e-06, -8.757226169109344e-06, -7.698312401771545e-06, -6.639398634433746e-06, -5.580484867095947e-06, -4.521571099758148e-06, -3.462657332420349e-06, -2.40374356508255e-06, -1.344829797744751e-06, -2.859160304069519e-07, 7.729977369308472e-07, 1.8319115042686462e-06, 2.8908252716064453e-06, 3.949739038944244e-06, 5.0086528062820435e-06, 6.0675665736198425e-06, 7.126480340957642e-06, 8.18539410829544e-06, 9.24430787563324e-06, 1.0303221642971039e-05, 1.1362135410308838e-05, 1.2421049177646637e-05, 1.3479962944984436e-05, 1.4538876712322235e-05, 1.5597790479660034e-05, 1.6656704246997833e-05, 1.7715618014335632e-05, 1.877453178167343e-05, 1.983344554901123e-05, 2.089235931634903e-05, 2.195127308368683e-05, 2.3010186851024628e-05, 2.4069100618362427e-05, 2.5128014385700226e-05, 2.6186928153038025e-05, 2.7245841920375824e-05, 2.8304755687713623e-05, 2.9363669455051422e-05, 3.042258322238922e-05, 3.148149698972702e-05, 3.254041075706482e-05, 3.359932452440262e-05, 3.465823829174042e-05, 3.5717152059078217e-05, 3.6776065826416016e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 9.0, 12.0, 19.0, 22.0, 38.0, 65.0, 87.0, 162.0, 281.0, 424.0, 764.0, 1510.0, 3369.0, 8534.0, 26563.0, 140907.0, 787311.0, 54296.0, 14526.0, 5039.0, 2194.0, 1028.0, 550.0, 326.0, 199.0, 118.0, 67.0, 36.0, 32.0, 20.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08353042602539062, -0.08094024658203125, -0.07835006713867188, -0.0757598876953125, -0.07316970825195312, -0.07057952880859375, -0.06798934936523438, -0.065399169921875, -0.06280899047851562, -0.06021881103515625, -0.057628631591796875, -0.0550384521484375, -0.052448272705078125, -0.04985809326171875, -0.047267913818359375, -0.044677734375, -0.042087554931640625, -0.03949737548828125, -0.036907196044921875, -0.0343170166015625, -0.031726837158203125, -0.02913665771484375, -0.026546478271484375, -0.023956298828125, -0.021366119384765625, -0.01877593994140625, -0.016185760498046875, -0.0135955810546875, -0.011005401611328125, -0.00841522216796875, -0.005825042724609375, -0.00323486328125, -0.000644683837890625, 0.00194549560546875, 0.004535675048828125, 0.0071258544921875, 0.009716033935546875, 0.01230621337890625, 0.014896392822265625, 0.017486572265625, 0.020076751708984375, 0.02266693115234375, 0.025257110595703125, 0.0278472900390625, 0.030437469482421875, 0.03302764892578125, 0.035617828369140625, 0.0382080078125, 0.040798187255859375, 0.04338836669921875, 0.045978546142578125, 0.0485687255859375, 0.051158905029296875, 0.05374908447265625, 0.056339263916015625, 0.058929443359375, 0.061519622802734375, 0.06410980224609375, 0.06669998168945312, 0.0692901611328125, 0.07188034057617188, 0.07447052001953125, 0.07706069946289062, 0.07965087890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 2.0, 7.0, 16.0, 13.0, 12.0, 13.0, 16.0, 30.0, 38.0, 79.0, 110.0, 124.0, 156.0, 109.0, 70.0, 50.0, 37.0, 19.0, 14.0, 12.0, 14.0, 7.0, 4.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.10679149627685547, -0.10365867614746094, -0.1005258560180664, -0.09739303588867188, -0.09426021575927734, -0.09112739562988281, -0.08799457550048828, -0.08486175537109375, -0.08172893524169922, -0.07859611511230469, -0.07546329498291016, -0.07233047485351562, -0.0691976547241211, -0.06606483459472656, -0.06293201446533203, -0.0597991943359375, -0.05666637420654297, -0.05353355407714844, -0.050400733947753906, -0.047267913818359375, -0.044135093688964844, -0.04100227355957031, -0.03786945343017578, -0.03473663330078125, -0.03160381317138672, -0.028470993041992188, -0.025338172912597656, -0.022205352783203125, -0.019072532653808594, -0.015939712524414062, -0.012806892395019531, -0.009674072265625, -0.006541252136230469, -0.0034084320068359375, -0.00027561187744140625, 0.002857208251953125, 0.005990028381347656, 0.009122848510742188, 0.012255668640136719, 0.01538848876953125, 0.01852130889892578, 0.021654129028320312, 0.024786949157714844, 0.027919769287109375, 0.031052589416503906, 0.03418540954589844, 0.03731822967529297, 0.0404510498046875, 0.04358386993408203, 0.04671669006347656, 0.049849510192871094, 0.052982330322265625, 0.056115150451660156, 0.05924797058105469, 0.06238079071044922, 0.06551361083984375, 0.06864643096923828, 0.07177925109863281, 0.07491207122802734, 0.07804489135742188, 0.0811777114868164, 0.08431053161621094, 0.08744335174560547, 0.090576171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 18.0, 24.0, 53.0, 118.0, 509.0, 167.0, 55.0, 22.0, 16.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.491363048553467, -3.32965350151062, -3.1679439544677734, -3.0062344074249268, -2.84452486038208, -2.6828153133392334, -2.5211057662963867, -2.35939621925354, -2.1976866722106934, -2.0359771251678467, -1.874267578125, -1.7125580310821533, -1.5508484840393066, -1.38913893699646, -1.2274293899536133, -1.0657198429107666, -0.9040102958679199, -0.7423007488250732, -0.5805912017822266, -0.4188816547393799, -0.2571721076965332, -0.09546256065368652, 0.06624698638916016, 0.22795653343200684, 0.3896660804748535, 0.5513756275177002, 0.7130851745605469, 0.8747947216033936, 1.0365042686462402, 1.198213815689087, 1.3599233627319336, 1.5216329097747803, 1.6833429336547852, 1.8450524806976318, 2.0067620277404785, 2.168471574783325, 2.330181121826172, 2.4918906688690186, 2.6536002159118652, 2.815309762954712, 2.9770193099975586, 3.1387288570404053, 3.300438404083252, 3.4621479511260986, 3.6238574981689453, 3.785567045211792, 3.9472765922546387, 4.108985900878906, 4.270695686340332, 4.432405471801758, 4.594114780426025, 4.755824089050293, 4.917533874511719, 5.0792436599731445, 5.240952968597412, 5.40266227722168, 5.5643720626831055, 5.726081848144531, 5.887791156768799, 6.049500465393066, 6.211210250854492, 6.372920036315918, 6.5346293449401855, 6.696338653564453, 6.858048439025879]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 4.0, 5.0, 3.0, 12.0, 7.0, 8.0, 16.0, 16.0, 18.0, 13.0, 31.0, 12.0, 27.0, 35.0, 69.0, 114.0, 147.0, 133.0, 81.0, 53.0, 26.0, 17.0, 23.0, 17.0, 17.0, 16.0, 18.0, 6.0, 12.0, 9.0, 9.0, 7.0, 3.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6377370357513428, -2.5515856742858887, -2.4654340744018555, -2.3792827129364014, -2.2931313514709473, -2.206979990005493, -2.12082839012146, -2.034677028656006, -1.9485256671905518, -1.862374186515808, -1.776222825050354, -1.6900713443756104, -1.6039199829101562, -1.5177685022354126, -1.431617021560669, -1.3454656600952148, -1.2593141794204712, -1.1731626987457275, -1.0870113372802734, -1.0008598566055298, -0.9147084951400757, -0.828557014465332, -0.7424055933952332, -0.6562541723251343, -0.5701027512550354, -0.4839513301849365, -0.39779990911483765, -0.3116484582424164, -0.2254970371723175, -0.13934561610221863, -0.05319416522979736, 0.032957255840301514, 0.11910867691040039, 0.20526009798049927, 0.29141151905059814, 0.3775629699230194, 0.4637143909931183, 0.5498658418655396, 0.6360172629356384, 0.7221686840057373, 0.8083201050758362, 0.8944715261459351, 0.9806229472160339, 1.0667743682861328, 1.1529258489608765, 1.2390772104263306, 1.3252286911010742, 1.4113800525665283, 1.497531533241272, 1.5836830139160156, 1.6698343753814697, 1.7559858560562134, 1.8421372175216675, 1.9282886981964111, 2.0144400596618652, 2.1005916595458984, 2.1867430210113525, 2.2728943824768066, 2.35904598236084, 2.445197343826294, 2.531348705291748, 2.617500066757202, 2.7036516666412354, 2.7898030281066895, 2.8759543895721436]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 11.0, 13.0, 18.0, 17.0, 17.0, 17.0, 27.0, 25.0, 32.0, 31.0, 38.0, 47.0, 96.0, 168.0, 97.0, 50.0, 26.0, 27.0, 24.0, 26.0, 24.0, 28.0, 18.0, 17.0, 17.0, 17.0, 8.0, 8.0, 4.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.21248626708984375, -0.2054901123046875, -0.19849395751953125, -0.191497802734375, -0.18450164794921875, -0.1775054931640625, -0.17050933837890625, -0.16351318359375, -0.15651702880859375, -0.1495208740234375, -0.14252471923828125, -0.135528564453125, -0.12853240966796875, -0.1215362548828125, -0.11454010009765625, -0.1075439453125, -0.10054779052734375, -0.0935516357421875, -0.08655548095703125, -0.079559326171875, -0.07256317138671875, -0.0655670166015625, -0.05857086181640625, -0.05157470703125, -0.04457855224609375, -0.0375823974609375, -0.03058624267578125, -0.023590087890625, -0.01659393310546875, -0.0095977783203125, -0.00260162353515625, 0.00439453125, 0.01139068603515625, 0.0183868408203125, 0.02538299560546875, 0.032379150390625, 0.03937530517578125, 0.0463714599609375, 0.05336761474609375, 0.06036376953125, 0.06735992431640625, 0.0743560791015625, 0.08135223388671875, 0.088348388671875, 0.09534454345703125, 0.1023406982421875, 0.10933685302734375, 0.1163330078125, 0.12332916259765625, 0.1303253173828125, 0.13732147216796875, 0.144317626953125, 0.15131378173828125, 0.1583099365234375, 0.16530609130859375, 0.17230224609375, 0.17929840087890625, 0.1862945556640625, 0.19329071044921875, 0.200286865234375, 0.20728302001953125, 0.2142791748046875, 0.22127532958984375, 0.228271484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 12.0, 9.0, 9.0, 11.0, 22.0, 18.0, 51.0, 69.0, 105.0, 217.0, 378.0, 1232.0, 5160.0, 81662.0, 8288168.0, 8507.0, 1805.0, 547.0, 220.0, 127.0, 71.0, 32.0, 39.0, 19.0, 12.0, 13.0, 10.0, 5.0, 5.0, 2.0, 5.0, 3.0, 14.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.226417064666748, -2.1664845943450928, -2.1065521240234375, -2.046619415283203, -1.9866869449615479, -1.9267544746398926, -1.8668218851089478, -1.806889295578003, -1.7469568252563477, -1.6870243549346924, -1.6270917654037476, -1.5671591758728027, -1.5072267055511475, -1.4472942352294922, -1.3873616456985474, -1.3274290561676025, -1.2674965858459473, -1.207564115524292, -1.1476315259933472, -1.0876989364624023, -1.027766466140747, -0.967833936214447, -0.907901406288147, -0.8479688763618469, -0.7880363464355469, -0.7281038165092468, -0.6681712865829468, -0.6082387566566467, -0.5483062267303467, -0.48837369680404663, -0.4284411668777466, -0.36850863695144653, -0.30857622623443604, -0.248643696308136, -0.18871116638183594, -0.1287786364555359, -0.06884610652923584, -0.008913576602935791, 0.05101895332336426, 0.1109514832496643, 0.17088401317596436, 0.2308165431022644, 0.29074907302856445, 0.3506816029548645, 0.41061413288116455, 0.4705466628074646, 0.5304791927337646, 0.5904117226600647, 0.6503442525863647, 0.7102767825126648, 0.7702093124389648, 0.8301418423652649, 0.8900743722915649, 0.950006902217865, 1.009939432144165, 1.0698719024658203, 1.1298044919967651, 1.18973708152771, 1.2496695518493652, 1.3096020221710205, 1.3695346117019653, 1.4294672012329102, 1.4893996715545654, 1.5493321418762207, 1.6092647314071655]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 1.0, 4.0, 6.0, 2.0, 9.0, 1.0, 4.0, 6.0, 2.0, 6.0, 7.0, 7.0, 3.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.300006628036499, -2.208965301513672, -2.1179239749908447, -2.0268826484680176, -1.9358413219451904, -1.8447999954223633, -1.7537587881088257, -1.6627174615859985, -1.5716761350631714, -1.4806348085403442, -1.389593482017517, -1.2985522747039795, -1.2075109481811523, -1.1164696216583252, -1.025428295135498, -0.9343869686126709, -0.8433456420898438, -0.7523043155670166, -0.6612629890441895, -0.5702217221260071, -0.47918039560317993, -0.3881390690803528, -0.2970978021621704, -0.20605647563934326, -0.11501514911651611, -0.02397383749485016, 0.0670674741268158, 0.15810877084732056, 0.2491500973701477, 0.34019142389297485, 0.4312326908111572, 0.5222740173339844, 0.6133155822753906, 0.7043569087982178, 0.7953982353210449, 0.8864395022392273, 0.9774808287620544, 1.0685222148895264, 1.159563422203064, 1.2506047487258911, 1.3416460752487183, 1.4326874017715454, 1.5237287282943726, 1.6147699356079102, 1.7058112621307373, 1.7968525886535645, 1.8878939151763916, 1.9789352416992188, 2.069976568222046, 2.161017894744873, 2.2520592212677, 2.3431005477905273, 2.4341418743133545, 2.5251832008361816, 2.6162242889404297, 2.707265853881836, 2.798306941986084, 2.889348268508911, 2.9803895950317383, 3.0714309215545654, 3.1624722480773926, 3.2535135746002197, 3.344554901123047, 3.435595989227295, 3.526637554168701]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 13.0, 13.0, 15.0, 21.0, 38.0, 23.0, 41.0, 51.0, 55.0, 51.0, 61.0, 69.0, 60.0, 60.0, 66.0, 56.0, 61.0, 59.0, 45.0, 30.0, 20.0, 16.0, 12.0, 14.0, 18.0, 8.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2430419921875, -0.23597145080566406, -0.22890090942382812, -0.2218303680419922, -0.21475982666015625, -0.2076892852783203, -0.20061874389648438, -0.19354820251464844, -0.1864776611328125, -0.17940711975097656, -0.17233657836914062, -0.1652660369873047, -0.15819549560546875, -0.1511249542236328, -0.14405441284179688, -0.13698387145996094, -0.129913330078125, -0.12284278869628906, -0.11577224731445312, -0.10870170593261719, -0.10163116455078125, -0.09456062316894531, -0.08749008178710938, -0.08041954040527344, -0.0733489990234375, -0.06627845764160156, -0.059207916259765625, -0.05213737487792969, -0.04506683349609375, -0.03799629211425781, -0.030925750732421875, -0.023855209350585938, -0.01678466796875, -0.009714126586914062, -0.002643585205078125, 0.0044269561767578125, 0.01149749755859375, 0.018568038940429688, 0.025638580322265625, 0.03270912170410156, 0.0397796630859375, 0.04685020446777344, 0.053920745849609375, 0.06099128723144531, 0.06806182861328125, 0.07513236999511719, 0.08220291137695312, 0.08927345275878906, 0.096343994140625, 0.10341453552246094, 0.11048507690429688, 0.11755561828613281, 0.12462615966796875, 0.1316967010498047, 0.13876724243164062, 0.14583778381347656, 0.1529083251953125, 0.15997886657714844, 0.16704940795898438, 0.1741199493408203, 0.18119049072265625, 0.1882610321044922, 0.19533157348632812, 0.20240211486816406, 0.20947265625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 10.0, 13.0, 20.0, 32.0, 40.0, 47.0, 71.0, 94.0, 157.0, 267.0, 431.0, 787.0, 1625.0, 3180.0, 6979.0, 15868.0, 37509.0, 87101.0, 158705.0, 117519.0, 52331.0, 22589.0, 9903.0, 4450.0, 2066.0, 1004.0, 542.0, 305.0, 192.0, 121.0, 85.0, 51.0, 50.0, 31.0, 22.0, 16.0, 13.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98779296875, -0.9521255493164062, -0.9164581298828125, -0.8807907104492188, -0.845123291015625, -0.8094558715820312, -0.7737884521484375, -0.7381210327148438, -0.70245361328125, -0.6667861938476562, -0.6311187744140625, -0.5954513549804688, -0.559783935546875, -0.5241165161132812, -0.4884490966796875, -0.45278167724609375, -0.4171142578125, -0.38144683837890625, -0.3457794189453125, -0.31011199951171875, -0.274444580078125, -0.23877716064453125, -0.2031097412109375, -0.16744232177734375, -0.13177490234375, -0.09610748291015625, -0.0604400634765625, -0.02477264404296875, 0.010894775390625, 0.04656219482421875, 0.0822296142578125, 0.11789703369140625, 0.153564453125, 0.18923187255859375, 0.2248992919921875, 0.26056671142578125, 0.296234130859375, 0.33190155029296875, 0.3675689697265625, 0.40323638916015625, 0.43890380859375, 0.47457122802734375, 0.5102386474609375, 0.5459060668945312, 0.581573486328125, 0.6172409057617188, 0.6529083251953125, 0.6885757446289062, 0.7242431640625, 0.7599105834960938, 0.7955780029296875, 0.8312454223632812, 0.866912841796875, 0.9025802612304688, 0.9382476806640625, 0.9739151000976562, 1.00958251953125, 1.0452499389648438, 1.0809173583984375, 1.1165847778320312, 1.152252197265625, 1.1879196166992188, 1.2235870361328125, 1.2592544555664062, 1.294921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 13.0, 13.0, 17.0, 21.0, 20.0, 37.0, 39.0, 50.0, 64.0, 61.0, 66.0, 72.0, 66.0, 56.0, 73.0, 51.0, 43.0, 44.0, 42.0, 28.0, 26.0, 22.0, 14.0, 12.0, 6.0, 10.0, 1.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.20121002197265625, -0.1934356689453125, -0.18566131591796875, -0.177886962890625, -0.17011260986328125, -0.1623382568359375, -0.15456390380859375, -0.14678955078125, -0.13901519775390625, -0.1312408447265625, -0.12346649169921875, -0.115692138671875, -0.10791778564453125, -0.1001434326171875, -0.09236907958984375, -0.0845947265625, -0.07682037353515625, -0.0690460205078125, -0.06127166748046875, -0.053497314453125, -0.04572296142578125, -0.0379486083984375, -0.03017425537109375, -0.02239990234375, -0.01462554931640625, -0.0068511962890625, 0.00092315673828125, 0.008697509765625, 0.01647186279296875, 0.0242462158203125, 0.03202056884765625, 0.039794921875, 0.04756927490234375, 0.0553436279296875, 0.06311798095703125, 0.070892333984375, 0.07866668701171875, 0.0864410400390625, 0.09421539306640625, 0.10198974609375, 0.10976409912109375, 0.1175384521484375, 0.12531280517578125, 0.133087158203125, 0.14086151123046875, 0.1486358642578125, 0.15641021728515625, 0.1641845703125, 0.17195892333984375, 0.1797332763671875, 0.18750762939453125, 0.195281982421875, 0.20305633544921875, 0.2108306884765625, 0.21860504150390625, 0.22637939453125, 0.23415374755859375, 0.2419281005859375, 0.24970245361328125, 0.257476806640625, 0.26525115966796875, 0.2730255126953125, 0.28079986572265625, 0.28857421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 9.0, 14.0, 49.0, 83.0, 92.0, 95.0, 51.0, 21.0, 8.0, 10.0, 4.0, 6.0, 3.0, 5.0, 0.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.053524971008301, -1.992791771888733, -1.932058572769165, -1.8713253736495972, -1.8105921745300293, -1.7498589754104614, -1.6891257762908936, -1.6283925771713257, -1.5676593780517578, -1.50692617893219, -1.446192979812622, -1.3854597806930542, -1.3247265815734863, -1.2639933824539185, -1.2032601833343506, -1.1425269842147827, -1.0817937850952148, -1.021060585975647, -0.9603273868560791, -0.8995941877365112, -0.8388609886169434, -0.7781277894973755, -0.7173945903778076, -0.6566613912582397, -0.5959280729293823, -0.5351948738098145, -0.4744616746902466, -0.4137284755706787, -0.35299527645111084, -0.2922620475292206, -0.2315288484096527, -0.17079564929008484, -0.11006247997283936, -0.049329277127981186, 0.011403925716876984, 0.07213713228702545, 0.13287033140659332, 0.1936035454273224, 0.25433674454689026, 0.31506994366645813, 0.375803142786026, 0.43653634190559387, 0.49726954102516174, 0.558002769947052, 0.6187359690666199, 0.6794691681861877, 0.7402023673057556, 0.8009355664253235, 0.8616687655448914, 0.9224019646644592, 0.9831351637840271, 1.0438684225082397, 1.1046016216278076, 1.1653348207473755, 1.2260680198669434, 1.2868012189865112, 1.347534418106079, 1.408267617225647, 1.4690008163452148, 1.5297340154647827, 1.5904672145843506, 1.6512004137039185, 1.7119336128234863, 1.7726668119430542, 1.833400011062622]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 5.0, 4.0, 7.0, 7.0, 9.0, 27.0, 37.0, 65.0, 85.0, 74.0, 51.0, 23.0, 17.0, 11.0, 3.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0230109691619873, -0.9876903891563416, -0.9523698091506958, -0.91704922914505, -0.8817286491394043, -0.8464081287384033, -0.8110875487327576, -0.7757669687271118, -0.7404463887214661, -0.7051258087158203, -0.6698052287101746, -0.6344846487045288, -0.5991641283035278, -0.5638434886932373, -0.5285229682922363, -0.4932023882865906, -0.4578818082809448, -0.4225612282752991, -0.3872406482696533, -0.35192009806632996, -0.3165995180606842, -0.28127893805503845, -0.2459583729505539, -0.21063780784606934, -0.17531722784042358, -0.13999664783477783, -0.10467608273029327, -0.06935551017522812, -0.034034937620162964, 0.001285642385482788, 0.036606207489967346, 0.0719267725944519, 0.10724735260009766, 0.1425679326057434, 0.17788849771022797, 0.21320906281471252, 0.24852964282035828, 0.28385022282600403, 0.3191707730293274, 0.35449135303497314, 0.3898119330406189, 0.42513251304626465, 0.4604530930519104, 0.49577364325523376, 0.5310941934585571, 0.5664148330688477, 0.6017353534698486, 0.6370559334754944, 0.6723765134811401, 0.7076970934867859, 0.7430176734924316, 0.7783382534980774, 0.8136588335037231, 0.8489793539047241, 0.8842999339103699, 0.9196205139160156, 0.9549410939216614, 0.9902616739273071, 1.025582194328308, 1.0609028339385986, 1.0962233543395996, 1.1315439939498901, 1.1668645143508911, 1.2021851539611816, 1.2375056743621826]}, "eval/loss": 0.36502909660339355, "eval/wer": 0.11207854026180088, "eval/runtime": 567.0865, "eval/samples_per_second": 4.659, "eval/steps_per_second": 0.584} \ No newline at end of file