diff --git "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.3539, "train/learning_rate": 0.00029759999999999997, "train/epoch": 2.24, "train/global_step": 500, "_runtime": 11642, "_timestamp": 1648248770, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 411.0, 609.0], "bins": [-88.30326843261719, -86.90232849121094, -85.50139617919922, -84.10045623779297, -82.69951629638672, -81.298583984375, -79.89764404296875, -78.4967041015625, -77.09576416015625, -75.69482421875, -74.29389190673828, -72.89295196533203, -71.49201202392578, -70.09107971191406, -68.69013977050781, -67.28919982910156, -65.88826751708984, -64.4873275756836, -63.08639144897461, -61.685455322265625, -60.284515380859375, -58.88357925415039, -57.482643127441406, -56.081703186035156, -54.680763244628906, -53.27982711791992, -51.87888717651367, -50.47795104980469, -49.07701110839844, -47.67607498168945, -46.27513885498047, -44.87419891357422, -43.473262786865234, -42.07232666015625, -40.67138671875, -39.270450592041016, -37.869510650634766, -36.46857452392578, -35.06763458251953, -33.66669845581055, -32.26576232910156, -30.864824295043945, -29.463886260986328, -28.062950134277344, -26.662012100219727, -25.26107406616211, -23.860136032104492, -22.459197998046875, -21.058259963989258, -19.65732192993164, -18.256383895874023, -16.855445861816406, -15.454509735107422, -14.053571701049805, -12.652633666992188, -11.251696586608887, -9.850757598876953, -8.449819564819336, -7.048882484436035, -5.647944450378418, -4.247006893157959, -2.8460693359375, -1.4451313018798828, -0.04419422149658203, 1.356743335723877]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 8.0, 5.0, 12.0, 16.0, 24.0, 16.0, 19.0, 18.0, 29.0, 43.0, 38.0, 42.0, 45.0, 40.0, 36.0, 39.0, 55.0, 50.0, 33.0, 50.0, 35.0, 38.0, 34.0, 33.0, 31.0, 25.0, 26.0, 25.0, 25.0, 14.0, 20.0, 11.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-3.711008071899414, -3.6036376953125, -3.496267318725586, -3.3888967037200928, -3.2815263271331787, -3.1741559505462646, -3.0667853355407715, -2.9594149589538574, -2.8520445823669434, -2.7446742057800293, -2.6373038291931152, -2.529933214187622, -2.422562837600708, -2.315192461013794, -2.207821846008301, -2.1004514694213867, -1.9930810928344727, -1.8857107162475586, -1.778340220451355, -1.6709697246551514, -1.5635993480682373, -1.4562289714813232, -1.3488584756851196, -1.241487979888916, -1.134117603302002, -1.026747226715088, -0.9193767309188843, -0.8120062947273254, -0.7046358585357666, -0.5972654223442078, -0.4898949861526489, -0.3825245499610901, -0.27515435218811035, -0.1677839159965515, -0.060413479804992676, 0.04695695638656616, 0.154327392578125, 0.26169782876968384, 0.3690682649612427, 0.4764387011528015, 0.5838091373443604, 0.6911795735359192, 0.798550009727478, 0.9059204459190369, 1.0132908821105957, 1.1206612586975098, 1.2280317544937134, 1.335402250289917, 1.442772626876831, 1.5501430034637451, 1.6575134992599487, 1.7648839950561523, 1.8722543716430664, 1.9796247482299805, 2.0869951248168945, 2.1943657398223877, 2.3017361164093018, 2.409106492996216, 2.516477108001709, 2.623847484588623, 2.731217861175537, 2.838588237762451, 2.9459586143493652, 3.0533292293548584, 3.1606996059417725]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 1.0, 10.0, 16.0, 11.0, 20.0, 22.0, 52.0, 64.0, 112.0, 259.0, 510.0, 1177.0, 3263.0, 11252.0, 47641.0, 180398.0, 631313.0, 1818733.0, 1076307.0, 305101.0, 82868.0, 23987.0, 7322.0, 2316.0, 778.0, 337.0, 145.0, 81.0, 52.0, 36.0, 22.0, 15.0, 6.0, 13.0, 6.0, 5.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.37689208984375, -4.2576904296875, -4.13848876953125, -4.019287109375, -3.90008544921875, -3.7808837890625, -3.66168212890625, -3.54248046875, -3.42327880859375, -3.3040771484375, -3.18487548828125, -3.065673828125, -2.94647216796875, -2.8272705078125, -2.70806884765625, -2.5888671875, -2.46966552734375, -2.3504638671875, -2.23126220703125, -2.112060546875, -1.99285888671875, -1.8736572265625, -1.75445556640625, -1.63525390625, -1.51605224609375, -1.3968505859375, -1.27764892578125, -1.158447265625, -1.03924560546875, -0.9200439453125, -0.80084228515625, -0.681640625, -0.56243896484375, -0.4432373046875, -0.32403564453125, -0.204833984375, -0.08563232421875, 0.0335693359375, 0.15277099609375, 0.27197265625, 0.39117431640625, 0.5103759765625, 0.62957763671875, 0.748779296875, 0.86798095703125, 0.9871826171875, 1.10638427734375, 1.2255859375, 1.34478759765625, 1.4639892578125, 1.58319091796875, 1.702392578125, 1.82159423828125, 1.9407958984375, 2.05999755859375, 2.17919921875, 2.29840087890625, 2.4176025390625, 2.53680419921875, 2.656005859375, 2.77520751953125, 2.8944091796875, 3.01361083984375, 3.1328125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 1.0, 3.0, 10.0, 9.0, 16.0, 15.0, 20.0, 28.0, 27.0, 28.0, 35.0, 43.0, 49.0, 48.0, 49.0, 42.0, 47.0, 46.0, 41.0, 46.0, 55.0, 45.0, 33.0, 39.0, 33.0, 27.0, 26.0, 22.0, 24.0, 12.0, 13.0, 13.0, 5.0, 7.0, 6.0, 7.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.94140625, -4.809234619140625, -4.67706298828125, -4.544891357421875, -4.4127197265625, -4.280548095703125, -4.14837646484375, -4.016204833984375, -3.884033203125, -3.751861572265625, -3.61968994140625, -3.487518310546875, -3.3553466796875, -3.223175048828125, -3.09100341796875, -2.958831787109375, -2.82666015625, -2.694488525390625, -2.56231689453125, -2.430145263671875, -2.2979736328125, -2.165802001953125, -2.03363037109375, -1.901458740234375, -1.769287109375, -1.637115478515625, -1.50494384765625, -1.372772216796875, -1.2406005859375, -1.108428955078125, -0.97625732421875, -0.844085693359375, -0.7119140625, -0.579742431640625, -0.44757080078125, -0.315399169921875, -0.1832275390625, -0.051055908203125, 0.08111572265625, 0.213287353515625, 0.345458984375, 0.477630615234375, 0.60980224609375, 0.741973876953125, 0.8741455078125, 1.006317138671875, 1.13848876953125, 1.270660400390625, 1.40283203125, 1.535003662109375, 1.66717529296875, 1.799346923828125, 1.9315185546875, 2.063690185546875, 2.19586181640625, 2.328033447265625, 2.460205078125, 2.592376708984375, 2.72454833984375, 2.856719970703125, 2.9888916015625, 3.121063232421875, 3.25323486328125, 3.385406494140625, 3.517578125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 11.0, 15.0, 21.0, 43.0, 67.0, 155.0, 385.0, 2110.0, 4190160.0, 847.0, 243.0, 114.0, 46.0, 26.0, 11.0, 11.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.6875, -98.4404296875, -95.193359375, -91.9462890625, -88.69921875, -85.4521484375, -82.205078125, -78.9580078125, -75.7109375, -72.4638671875, -69.216796875, -65.9697265625, -62.72265625, -59.4755859375, -56.228515625, -52.9814453125, -49.734375, -46.4873046875, -43.240234375, -39.9931640625, -36.74609375, -33.4990234375, -30.251953125, -27.0048828125, -23.7578125, -20.5107421875, -17.263671875, -14.0166015625, -10.76953125, -7.5224609375, -4.275390625, -1.0283203125, 2.21875, 5.4658203125, 8.712890625, 11.9599609375, 15.20703125, 18.4541015625, 21.701171875, 24.9482421875, 28.1953125, 31.4423828125, 34.689453125, 37.9365234375, 41.18359375, 44.4306640625, 47.677734375, 50.9248046875, 54.171875, 57.4189453125, 60.666015625, 63.9130859375, 67.16015625, 70.4072265625, 73.654296875, 76.9013671875, 80.1484375, 83.3955078125, 86.642578125, 89.8896484375, 93.13671875, 96.3837890625, 99.630859375, 102.8779296875, 106.125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 12.0, 20.0, 32.0, 51.0, 103.0, 248.0, 541.0, 1258.0, 1025.0, 407.0, 170.0, 94.0, 44.0, 28.0, 8.0, 3.0, 10.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.4842529296875, -2.398193359375, -2.3121337890625, -2.22607421875, -2.1400146484375, -2.053955078125, -1.9678955078125, -1.8818359375, -1.7957763671875, -1.709716796875, -1.6236572265625, -1.53759765625, -1.4515380859375, -1.365478515625, -1.2794189453125, -1.193359375, -1.1072998046875, -1.021240234375, -0.9351806640625, -0.84912109375, -0.7630615234375, -0.677001953125, -0.5909423828125, -0.5048828125, -0.4188232421875, -0.332763671875, -0.2467041015625, -0.16064453125, -0.0745849609375, 0.011474609375, 0.0975341796875, 0.18359375, 0.2696533203125, 0.355712890625, 0.4417724609375, 0.52783203125, 0.6138916015625, 0.699951171875, 0.7860107421875, 0.8720703125, 0.9581298828125, 1.044189453125, 1.1302490234375, 1.21630859375, 1.3023681640625, 1.388427734375, 1.4744873046875, 1.560546875, 1.6466064453125, 1.732666015625, 1.8187255859375, 1.90478515625, 1.9908447265625, 2.076904296875, 2.1629638671875, 2.2490234375, 2.3350830078125, 2.421142578125, 2.5072021484375, 2.59326171875, 2.6793212890625, 2.765380859375, 2.8514404296875, 2.9375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 15.0, 20.0, 49.0, 87.0, 101.0, 141.0, 142.0, 143.0, 92.0, 79.0, 47.0, 31.0, 26.0, 7.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0130157470703125, -4.75441312789917, -4.495810508728027, -4.237207889556885, -3.9786055088043213, -3.7200028896331787, -3.4614005088806152, -3.2027978897094727, -2.94419527053833, -2.6855926513671875, -2.426990032196045, -2.1683876514434814, -1.9097850322723389, -1.6511824131011963, -1.3925799131393433, -1.1339774131774902, -0.8753747940063477, -0.6167722344398499, -0.35816967487335205, -0.09956711530685425, 0.15903544425964355, 0.41763806343078613, 0.6762405633926392, 0.9348430633544922, 1.1934456825256348, 1.4520483016967773, 1.7106508016586304, 1.9692533016204834, 2.227855920791626, 2.4864585399627686, 2.745060920715332, 3.0036635398864746, 3.2622671127319336, 3.520869731903076, 3.7794723510742188, 4.038074970245361, 4.296677589416504, 4.555279731750488, 4.813882350921631, 5.072484970092773, 5.331087589263916, 5.589690208435059, 5.848292827606201, 6.106895446777344, 6.365497589111328, 6.624100685119629, 6.882702827453613, 7.141305446624756, 7.399908065795898, 7.658510684967041, 7.917113304138184, 8.175715446472168, 8.434318542480469, 8.692920684814453, 8.951523780822754, 9.210125923156738, 9.468729019165039, 9.727331161499023, 9.985934257507324, 10.244536399841309, 10.50313949584961, 10.761741638183594, 11.020344734191895, 11.278946876525879, 11.537549018859863]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 10.0, 6.0, 14.0, 19.0, 16.0, 20.0, 21.0, 27.0, 38.0, 40.0, 30.0, 41.0, 43.0, 47.0, 52.0, 46.0, 44.0, 41.0, 44.0, 35.0, 39.0, 31.0, 38.0, 28.0, 38.0, 28.0, 24.0, 20.0, 23.0, 18.0, 10.0, 14.0, 8.0, 7.0, 3.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.213425636291504, -4.086343765258789, -3.9592621326446533, -3.8321802616119385, -3.7050983905792236, -3.578016757965088, -3.450934886932373, -3.323853015899658, -3.1967711448669434, -3.0696892738342285, -2.9426076412200928, -2.815525770187378, -2.688443899154663, -2.5613622665405273, -2.4342803955078125, -2.3071985244750977, -2.180116891860962, -2.053035020828247, -1.9259532690048218, -1.7988715171813965, -1.6717896461486816, -1.5447078943252563, -1.417626142501831, -1.2905442714691162, -1.163462519645691, -1.0363807678222656, -0.9092988967895508, -0.7822171449661255, -0.6551353335380554, -0.5280535221099854, -0.40097177028656006, -0.27388995885849, -0.14680814743041992, -0.019726350903511047, 0.10735544562339783, 0.2344372272491455, 0.3615190386772156, 0.48860085010528564, 0.6156826019287109, 0.742764413356781, 0.8698462247848511, 0.9969280362129211, 1.1240098476409912, 1.2510915994644165, 1.3781733512878418, 1.5052552223205566, 1.632336974143982, 1.7594187259674072, 1.886500597000122, 2.013582468032837, 2.1406641006469727, 2.2677459716796875, 2.3948278427124023, 2.521909713745117, 2.648991346359253, 2.7760732173919678, 2.9031548500061035, 3.0302367210388184, 3.157318353652954, 3.284400224685669, 3.411482095718384, 3.5385637283325195, 3.6656455993652344, 3.792727470397949, 3.919809341430664]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 11.0, 15.0, 26.0, 51.0, 67.0, 101.0, 156.0, 322.0, 515.0, 987.0, 2133.0, 4654.0, 11486.0, 30369.0, 84769.0, 211614.0, 327194.0, 225498.0, 93197.0, 33448.0, 12276.0, 5011.0, 2183.0, 1085.0, 554.0, 294.0, 208.0, 128.0, 58.0, 44.0, 31.0, 17.0, 14.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.236572265625, -1.19970703125, -1.162841796875, -1.1259765625, -1.089111328125, -1.05224609375, -1.015380859375, -0.978515625, -0.941650390625, -0.90478515625, -0.867919921875, -0.8310546875, -0.794189453125, -0.75732421875, -0.720458984375, -0.68359375, -0.646728515625, -0.60986328125, -0.572998046875, -0.5361328125, -0.499267578125, -0.46240234375, -0.425537109375, -0.388671875, -0.351806640625, -0.31494140625, -0.278076171875, -0.2412109375, -0.204345703125, -0.16748046875, -0.130615234375, -0.09375, -0.056884765625, -0.02001953125, 0.016845703125, 0.0537109375, 0.090576171875, 0.12744140625, 0.164306640625, 0.201171875, 0.238037109375, 0.27490234375, 0.311767578125, 0.3486328125, 0.385498046875, 0.42236328125, 0.459228515625, 0.49609375, 0.532958984375, 0.56982421875, 0.606689453125, 0.6435546875, 0.680419921875, 0.71728515625, 0.754150390625, 0.791015625, 0.827880859375, 0.86474609375, 0.901611328125, 0.9384765625, 0.975341796875, 1.01220703125, 1.049072265625, 1.0859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 5.0, 17.0, 19.0, 31.0, 19.0, 34.0, 35.0, 41.0, 49.0, 50.0, 56.0, 46.0, 52.0, 57.0, 48.0, 54.0, 41.0, 46.0, 47.0, 28.0, 30.0, 32.0, 33.0, 31.0, 23.0, 9.0, 6.0, 5.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.48828125, -3.36920166015625, -3.2501220703125, -3.13104248046875, -3.011962890625, -2.89288330078125, -2.7738037109375, -2.65472412109375, -2.53564453125, -2.41656494140625, -2.2974853515625, -2.17840576171875, -2.059326171875, -1.94024658203125, -1.8211669921875, -1.70208740234375, -1.5830078125, -1.46392822265625, -1.3448486328125, -1.22576904296875, -1.106689453125, -0.98760986328125, -0.8685302734375, -0.74945068359375, -0.63037109375, -0.51129150390625, -0.3922119140625, -0.27313232421875, -0.154052734375, -0.03497314453125, 0.0841064453125, 0.20318603515625, 0.322265625, 0.44134521484375, 0.5604248046875, 0.67950439453125, 0.798583984375, 0.91766357421875, 1.0367431640625, 1.15582275390625, 1.27490234375, 1.39398193359375, 1.5130615234375, 1.63214111328125, 1.751220703125, 1.87030029296875, 1.9893798828125, 2.10845947265625, 2.2275390625, 2.34661865234375, 2.4656982421875, 2.58477783203125, 2.703857421875, 2.82293701171875, 2.9420166015625, 3.06109619140625, 3.18017578125, 3.29925537109375, 3.4183349609375, 3.53741455078125, 3.656494140625, 3.77557373046875, 3.8946533203125, 4.01373291015625, 4.1328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 8.0, 6.0, 3.0, 19.0, 19.0, 42.0, 61.0, 101.0, 180.0, 251.0, 373.0, 717.0, 1229.0, 2344.0, 4573.0, 8816.0, 18243.0, 37369.0, 75220.0, 138485.0, 209258.0, 220547.0, 156528.0, 87709.0, 43818.0, 21162.0, 10191.0, 5267.0, 2624.0, 1500.0, 787.0, 414.0, 254.0, 167.0, 85.0, 60.0, 44.0, 25.0, 16.0, 16.0, 10.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5859375, -0.5682449340820312, -0.5505523681640625, -0.5328598022460938, -0.515167236328125, -0.49747467041015625, -0.4797821044921875, -0.46208953857421875, -0.44439697265625, -0.42670440673828125, -0.4090118408203125, -0.39131927490234375, -0.373626708984375, -0.35593414306640625, -0.3382415771484375, -0.32054901123046875, -0.3028564453125, -0.28516387939453125, -0.2674713134765625, -0.24977874755859375, -0.232086181640625, -0.21439361572265625, -0.1967010498046875, -0.17900848388671875, -0.16131591796875, -0.14362335205078125, -0.1259307861328125, -0.10823822021484375, -0.090545654296875, -0.07285308837890625, -0.0551605224609375, -0.03746795654296875, -0.019775390625, -0.00208282470703125, 0.0156097412109375, 0.03330230712890625, 0.050994873046875, 0.06868743896484375, 0.0863800048828125, 0.10407257080078125, 0.12176513671875, 0.13945770263671875, 0.1571502685546875, 0.17484283447265625, 0.192535400390625, 0.21022796630859375, 0.2279205322265625, 0.24561309814453125, 0.2633056640625, 0.28099822998046875, 0.2986907958984375, 0.31638336181640625, 0.334075927734375, 0.35176849365234375, 0.3694610595703125, 0.38715362548828125, 0.40484619140625, 0.42253875732421875, 0.4402313232421875, 0.45792388916015625, 0.475616455078125, 0.49330902099609375, 0.5110015869140625, 0.5286941528320312, 0.54638671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 6.0, 7.0, 7.0, 19.0, 13.0, 17.0, 22.0, 25.0, 26.0, 35.0, 32.0, 39.0, 39.0, 34.0, 46.0, 45.0, 53.0, 47.0, 47.0, 43.0, 50.0, 44.0, 36.0, 48.0, 27.0, 31.0, 21.0, 28.0, 29.0, 19.0, 14.0, 8.0, 10.0, 8.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.23828125, -6.03662109375, -5.8349609375, -5.63330078125, -5.431640625, -5.22998046875, -5.0283203125, -4.82666015625, -4.625, -4.42333984375, -4.2216796875, -4.02001953125, -3.818359375, -3.61669921875, -3.4150390625, -3.21337890625, -3.01171875, -2.81005859375, -2.6083984375, -2.40673828125, -2.205078125, -2.00341796875, -1.8017578125, -1.60009765625, -1.3984375, -1.19677734375, -0.9951171875, -0.79345703125, -0.591796875, -0.39013671875, -0.1884765625, 0.01318359375, 0.21484375, 0.41650390625, 0.6181640625, 0.81982421875, 1.021484375, 1.22314453125, 1.4248046875, 1.62646484375, 1.828125, 2.02978515625, 2.2314453125, 2.43310546875, 2.634765625, 2.83642578125, 3.0380859375, 3.23974609375, 3.44140625, 3.64306640625, 3.8447265625, 4.04638671875, 4.248046875, 4.44970703125, 4.6513671875, 4.85302734375, 5.0546875, 5.25634765625, 5.4580078125, 5.65966796875, 5.861328125, 6.06298828125, 6.2646484375, 6.46630859375, 6.66796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 5.0, 9.0, 13.0, 18.0, 30.0, 53.0, 92.0, 152.0, 257.0, 442.0, 776.0, 1500.0, 3213.0, 7931.0, 23571.0, 92976.0, 410322.0, 386160.0, 85067.0, 22104.0, 7520.0, 2992.0, 1526.0, 740.0, 448.0, 257.0, 136.0, 86.0, 46.0, 40.0, 27.0, 13.0, 11.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18700027465820312, -0.18149566650390625, -0.17599105834960938, -0.1704864501953125, -0.16498184204101562, -0.15947723388671875, -0.15397262573242188, -0.148468017578125, -0.14296340942382812, -0.13745880126953125, -0.13195419311523438, -0.1264495849609375, -0.12094497680664062, -0.11544036865234375, -0.10993576049804688, -0.10443115234375, -0.09892654418945312, -0.09342193603515625, -0.08791732788085938, -0.0824127197265625, -0.07690811157226562, -0.07140350341796875, -0.06589889526367188, -0.060394287109375, -0.054889678955078125, -0.04938507080078125, -0.043880462646484375, -0.0383758544921875, -0.032871246337890625, -0.02736663818359375, -0.021862030029296875, -0.016357421875, -0.010852813720703125, -0.00534820556640625, 0.000156402587890625, 0.0056610107421875, 0.011165618896484375, 0.01667022705078125, 0.022174835205078125, 0.027679443359375, 0.033184051513671875, 0.03868865966796875, 0.044193267822265625, 0.0496978759765625, 0.055202484130859375, 0.06070709228515625, 0.06621170043945312, 0.07171630859375, 0.07722091674804688, 0.08272552490234375, 0.08823013305664062, 0.0937347412109375, 0.09923934936523438, 0.10474395751953125, 0.11024856567382812, 0.115753173828125, 0.12125778198242188, 0.12676239013671875, 0.13226699829101562, 0.1377716064453125, 0.14327621459960938, 0.14878082275390625, 0.15428543090820312, 0.1597900390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 3.0, 8.0, 7.0, 7.0, 14.0, 8.0, 16.0, 20.0, 32.0, 36.0, 46.0, 64.0, 65.0, 77.0, 77.0, 82.0, 78.0, 67.0, 51.0, 51.0, 34.0, 38.0, 22.0, 11.0, 11.0, 22.0, 7.0, 9.0, 3.0, 10.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.34600830078125e-05, -9.043421596288681e-05, -8.740834891796112e-05, -8.438248187303543e-05, -8.135661482810974e-05, -7.833074778318405e-05, -7.530488073825836e-05, -7.227901369333267e-05, -6.925314664840698e-05, -6.622727960348129e-05, -6.32014125585556e-05, -6.017554551362991e-05, -5.7149678468704224e-05, -5.4123811423778534e-05, -5.1097944378852844e-05, -4.8072077333927155e-05, -4.5046210289001465e-05, -4.2020343244075775e-05, -3.8994476199150085e-05, -3.5968609154224396e-05, -3.2942742109298706e-05, -2.9916875064373016e-05, -2.6891008019447327e-05, -2.3865140974521637e-05, -2.0839273929595947e-05, -1.7813406884670258e-05, -1.4787539839744568e-05, -1.1761672794818878e-05, -8.735805749893188e-06, -5.709938704967499e-06, -2.684071660041809e-06, 3.417953848838806e-07, 3.3676624298095703e-06, 6.39352947473526e-06, 9.41939651966095e-06, 1.244526356458664e-05, 1.547113060951233e-05, 1.849699765443802e-05, 2.152286469936371e-05, 2.4548731744289398e-05, 2.7574598789215088e-05, 3.060046583414078e-05, 3.362633287906647e-05, 3.665219992399216e-05, 3.967806696891785e-05, 4.2703934013843536e-05, 4.5729801058769226e-05, 4.8755668103694916e-05, 5.1781535148620605e-05, 5.4807402193546295e-05, 5.7833269238471985e-05, 6.0859136283397675e-05, 6.388500332832336e-05, 6.691087037324905e-05, 6.993673741817474e-05, 7.296260446310043e-05, 7.598847150802612e-05, 7.901433855295181e-05, 8.20402055978775e-05, 8.506607264280319e-05, 8.809193968772888e-05, 9.111780673265457e-05, 9.414367377758026e-05, 9.716954082250595e-05, 0.00010019540786743164]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 9.0, 8.0, 9.0, 6.0, 7.0, 10.0, 11.0, 12.0, 11.0, 17.0, 31.0, 31.0, 47.0, 60.0, 99.0, 158.0, 294.0, 4471.0, 873077.0, 168055.0, 1404.0, 241.0, 144.0, 84.0, 48.0, 44.0, 23.0, 26.0, 21.0, 18.0, 10.0, 7.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94580078125, -0.9151382446289062, -0.8844757080078125, -0.8538131713867188, -0.823150634765625, -0.7924880981445312, -0.7618255615234375, -0.7311630249023438, -0.70050048828125, -0.6698379516601562, -0.6391754150390625, -0.6085128784179688, -0.577850341796875, -0.5471878051757812, -0.5165252685546875, -0.48586273193359375, -0.4552001953125, -0.42453765869140625, -0.3938751220703125, -0.36321258544921875, -0.332550048828125, -0.30188751220703125, -0.2712249755859375, -0.24056243896484375, -0.20989990234375, -0.17923736572265625, -0.1485748291015625, -0.11791229248046875, -0.087249755859375, -0.05658721923828125, -0.0259246826171875, 0.00473785400390625, 0.035400390625, 0.06606292724609375, 0.0967254638671875, 0.12738800048828125, 0.158050537109375, 0.18871307373046875, 0.2193756103515625, 0.25003814697265625, 0.28070068359375, 0.31136322021484375, 0.3420257568359375, 0.37268829345703125, 0.403350830078125, 0.43401336669921875, 0.4646759033203125, 0.49533843994140625, 0.5260009765625, 0.5566635131835938, 0.5873260498046875, 0.6179885864257812, 0.648651123046875, 0.6793136596679688, 0.7099761962890625, 0.7406387329101562, 0.77130126953125, 0.8019638061523438, 0.8326263427734375, 0.8632888793945312, 0.893951416015625, 0.9246139526367188, 0.9552764892578125, 0.9859390258789062, 1.0166015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 8.0, 9.0, 11.0, 7.0, 8.0, 7.0, 15.0, 19.0, 18.0, 19.0, 32.0, 36.0, 43.0, 57.0, 67.0, 95.0, 82.0, 68.0, 74.0, 57.0, 42.0, 28.0, 25.0, 25.0, 15.0, 22.0, 19.0, 13.0, 10.0, 9.0, 7.0, 5.0, 5.0, 6.0, 7.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.07611083984375, -0.07376575469970703, -0.07142066955566406, -0.0690755844116211, -0.06673049926757812, -0.06438541412353516, -0.06204032897949219, -0.05969524383544922, -0.05735015869140625, -0.05500507354736328, -0.05265998840332031, -0.050314903259277344, -0.047969818115234375, -0.045624732971191406, -0.04327964782714844, -0.04093456268310547, -0.0385894775390625, -0.03624439239501953, -0.03389930725097656, -0.031554222106933594, -0.029209136962890625, -0.026864051818847656, -0.024518966674804688, -0.02217388153076172, -0.01982879638671875, -0.01748371124267578, -0.015138626098632812, -0.012793540954589844, -0.010448455810546875, -0.008103370666503906, -0.0057582855224609375, -0.0034132003784179688, -0.001068115234375, 0.0012769699096679688, 0.0036220550537109375, 0.005967140197753906, 0.008312225341796875, 0.010657310485839844, 0.013002395629882812, 0.015347480773925781, 0.01769256591796875, 0.02003765106201172, 0.022382736206054688, 0.024727821350097656, 0.027072906494140625, 0.029417991638183594, 0.03176307678222656, 0.03410816192626953, 0.0364532470703125, 0.03879833221435547, 0.04114341735839844, 0.043488502502441406, 0.045833587646484375, 0.048178672790527344, 0.05052375793457031, 0.05286884307861328, 0.05521392822265625, 0.05755901336669922, 0.05990409851074219, 0.062249183654785156, 0.06459426879882812, 0.0669393539428711, 0.06928443908691406, 0.07162952423095703, 0.073974609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 8.0, 19.0, 42.0, 91.0, 196.0, 249.0, 193.0, 96.0, 74.0, 24.0, 12.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.921342849731445, -11.595335960388184, -11.269329071044922, -10.943321228027344, -10.617314338684082, -10.29130744934082, -9.965299606323242, -9.63929271697998, -9.313285827636719, -8.987278938293457, -8.661272048950195, -8.335264205932617, -8.009257316589355, -7.683250427246094, -7.357243061065674, -7.031235694885254, -6.705228805541992, -6.3792219161987305, -6.0532145500183105, -5.727207183837891, -5.401200294494629, -5.075193405151367, -4.749186038970947, -4.423178672790527, -4.097171783447266, -3.771164655685425, -3.445157527923584, -3.119150400161743, -2.7931432723999023, -2.4671361446380615, -2.1411290168762207, -1.8151218891143799, -1.489114761352539, -1.1631076335906982, -0.8371005058288574, -0.5110933780670166, -0.18508625030517578, 0.14092087745666504, 0.46692800521850586, 0.7929351329803467, 1.1189422607421875, 1.4449493885040283, 1.7709565162658691, 2.09696364402771, 2.422970771789551, 2.7489778995513916, 3.0749850273132324, 3.4009921550750732, 3.726999282836914, 4.053006172180176, 4.379013538360596, 4.705020904541016, 5.031027793884277, 5.357034683227539, 5.683042049407959, 6.009049415588379, 6.335056304931641, 6.661063194274902, 6.987070560455322, 7.313077926635742, 7.639084815979004, 7.965091705322266, 8.291099548339844, 8.617106437683105, 8.943113327026367]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 10.0, 6.0, 11.0, 11.0, 20.0, 14.0, 13.0, 26.0, 30.0, 36.0, 38.0, 36.0, 39.0, 48.0, 53.0, 53.0, 42.0, 44.0, 49.0, 49.0, 31.0, 49.0, 34.0, 34.0, 43.0, 26.0, 25.0, 18.0, 23.0, 19.0, 9.0, 11.0, 6.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1133792400360107, -3.0101258754730225, -2.9068727493286133, -2.803619384765625, -2.7003660202026367, -2.5971126556396484, -2.49385929107666, -2.390606164932251, -2.2873528003692627, -2.1840994358062744, -2.0808463096618652, -1.977592945098877, -1.8743395805358887, -1.7710862159729004, -1.6678329706192017, -1.564579725265503, -1.4613263607025146, -1.3580729961395264, -1.2548197507858276, -1.151566505432129, -1.0483131408691406, -0.9450598359107971, -0.8418065309524536, -0.7385532259941101, -0.6352999210357666, -0.5320466160774231, -0.4287933111190796, -0.3255400061607361, -0.22228670120239258, -0.11903339624404907, -0.015780091285705566, 0.08747321367263794, 0.19072651863098145, 0.29397982358932495, 0.39723312854766846, 0.500486433506012, 0.6037397384643555, 0.706993043422699, 0.8102463483810425, 0.913499653339386, 1.0167529582977295, 1.1200063228607178, 1.2232595682144165, 1.3265128135681152, 1.4297661781311035, 1.5330195426940918, 1.6362727880477905, 1.7395260334014893, 1.8427793979644775, 1.9460327625274658, 2.049285888671875, 2.1525392532348633, 2.2557926177978516, 2.35904598236084, 2.462299346923828, 2.5655524730682373, 2.6688058376312256, 2.772059202194214, 2.875312328338623, 2.9785656929016113, 3.0818190574645996, 3.185072422027588, 3.288325786590576, 3.3915789127349854, 3.4948322772979736]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 12.0, 13.0, 25.0, 21.0, 31.0, 56.0, 79.0, 123.0, 234.0, 394.0, 847.0, 1808.0, 4558.0, 15265.0, 97025.0, 707040.0, 187788.0, 22668.0, 6069.0, 2243.0, 1023.0, 525.0, 233.0, 142.0, 107.0, 65.0, 47.0, 27.0, 14.0, 13.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.840850830078125, -2.74810791015625, -2.655364990234375, -2.5626220703125, -2.469879150390625, -2.37713623046875, -2.284393310546875, -2.191650390625, -2.098907470703125, -2.00616455078125, -1.913421630859375, -1.8206787109375, -1.727935791015625, -1.63519287109375, -1.542449951171875, -1.44970703125, -1.356964111328125, -1.26422119140625, -1.171478271484375, -1.0787353515625, -0.985992431640625, -0.89324951171875, -0.800506591796875, -0.707763671875, -0.615020751953125, -0.52227783203125, -0.429534912109375, -0.3367919921875, -0.244049072265625, -0.15130615234375, -0.058563232421875, 0.0341796875, 0.126922607421875, 0.21966552734375, 0.312408447265625, 0.4051513671875, 0.497894287109375, 0.59063720703125, 0.683380126953125, 0.776123046875, 0.868865966796875, 0.96160888671875, 1.054351806640625, 1.1470947265625, 1.239837646484375, 1.33258056640625, 1.425323486328125, 1.51806640625, 1.610809326171875, 1.70355224609375, 1.796295166015625, 1.8890380859375, 1.981781005859375, 2.07452392578125, 2.167266845703125, 2.260009765625, 2.352752685546875, 2.44549560546875, 2.538238525390625, 2.6309814453125, 2.723724365234375, 2.81646728515625, 2.909210205078125, 3.001953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 4.0, 11.0, 10.0, 13.0, 13.0, 21.0, 17.0, 27.0, 22.0, 29.0, 27.0, 23.0, 35.0, 30.0, 45.0, 46.0, 44.0, 48.0, 36.0, 35.0, 46.0, 41.0, 42.0, 46.0, 43.0, 25.0, 28.0, 28.0, 26.0, 27.0, 20.0, 14.0, 14.0, 12.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.31494140625, -5.1416015625, -4.96826171875, -4.794921875, -4.62158203125, -4.4482421875, -4.27490234375, -4.1015625, -3.92822265625, -3.7548828125, -3.58154296875, -3.408203125, -3.23486328125, -3.0615234375, -2.88818359375, -2.71484375, -2.54150390625, -2.3681640625, -2.19482421875, -2.021484375, -1.84814453125, -1.6748046875, -1.50146484375, -1.328125, -1.15478515625, -0.9814453125, -0.80810546875, -0.634765625, -0.46142578125, -0.2880859375, -0.11474609375, 0.05859375, 0.23193359375, 0.4052734375, 0.57861328125, 0.751953125, 0.92529296875, 1.0986328125, 1.27197265625, 1.4453125, 1.61865234375, 1.7919921875, 1.96533203125, 2.138671875, 2.31201171875, 2.4853515625, 2.65869140625, 2.83203125, 3.00537109375, 3.1787109375, 3.35205078125, 3.525390625, 3.69873046875, 3.8720703125, 4.04541015625, 4.21875, 4.39208984375, 4.5654296875, 4.73876953125, 4.912109375, 5.08544921875, 5.2587890625, 5.43212890625, 5.60546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 9.0, 7.0, 21.0, 23.0, 63.0, 139.0, 523.0, 7468.0, 1034318.0, 5264.0, 424.0, 133.0, 61.0, 30.0, 16.0, 13.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0078125, -13.4107666015625, -12.813720703125, -12.2166748046875, -11.61962890625, -11.0225830078125, -10.425537109375, -9.8284912109375, -9.2314453125, -8.6343994140625, -8.037353515625, -7.4403076171875, -6.84326171875, -6.2462158203125, -5.649169921875, -5.0521240234375, -4.455078125, -3.8580322265625, -3.260986328125, -2.6639404296875, -2.06689453125, -1.4698486328125, -0.872802734375, -0.2757568359375, 0.3212890625, 0.9183349609375, 1.515380859375, 2.1124267578125, 2.70947265625, 3.3065185546875, 3.903564453125, 4.5006103515625, 5.09765625, 5.6947021484375, 6.291748046875, 6.8887939453125, 7.48583984375, 8.0828857421875, 8.679931640625, 9.2769775390625, 9.8740234375, 10.4710693359375, 11.068115234375, 11.6651611328125, 12.26220703125, 12.8592529296875, 13.456298828125, 14.0533447265625, 14.650390625, 15.2474365234375, 15.844482421875, 16.4415283203125, 17.03857421875, 17.6356201171875, 18.232666015625, 18.8297119140625, 19.4267578125, 20.0238037109375, 20.620849609375, 21.2178955078125, 21.81494140625, 22.4119873046875, 23.009033203125, 23.6060791015625, 24.203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 10.0, 3.0, 7.0, 8.0, 12.0, 15.0, 24.0, 25.0, 25.0, 24.0, 29.0, 41.0, 34.0, 40.0, 40.0, 40.0, 45.0, 53.0, 54.0, 51.0, 39.0, 43.0, 35.0, 38.0, 41.0, 26.0, 26.0, 25.0, 25.0, 17.0, 24.0, 19.0, 9.0, 10.0, 10.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.72100830078125, -4.5474853515625, -4.37396240234375, -4.200439453125, -4.02691650390625, -3.8533935546875, -3.67987060546875, -3.50634765625, -3.33282470703125, -3.1593017578125, -2.98577880859375, -2.812255859375, -2.63873291015625, -2.4652099609375, -2.29168701171875, -2.1181640625, -1.94464111328125, -1.7711181640625, -1.59759521484375, -1.424072265625, -1.25054931640625, -1.0770263671875, -0.90350341796875, -0.72998046875, -0.55645751953125, -0.3829345703125, -0.20941162109375, -0.035888671875, 0.13763427734375, 0.3111572265625, 0.48468017578125, 0.658203125, 0.83172607421875, 1.0052490234375, 1.17877197265625, 1.352294921875, 1.52581787109375, 1.6993408203125, 1.87286376953125, 2.04638671875, 2.21990966796875, 2.3934326171875, 2.56695556640625, 2.740478515625, 2.91400146484375, 3.0875244140625, 3.26104736328125, 3.4345703125, 3.60809326171875, 3.7816162109375, 3.95513916015625, 4.128662109375, 4.30218505859375, 4.4757080078125, 4.64923095703125, 4.82275390625, 4.99627685546875, 5.1697998046875, 5.34332275390625, 5.516845703125, 5.69036865234375, 5.8638916015625, 6.03741455078125, 6.2109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 6.0, 13.0, 14.0, 51.0, 130.0, 1821.0, 1044201.0, 2087.0, 134.0, 48.0, 12.0, 11.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.59375, -51.38525390625, -50.1767578125, -48.96826171875, -47.759765625, -46.55126953125, -45.3427734375, -44.13427734375, -42.92578125, -41.71728515625, -40.5087890625, -39.30029296875, -38.091796875, -36.88330078125, -35.6748046875, -34.46630859375, -33.2578125, -32.04931640625, -30.8408203125, -29.63232421875, -28.423828125, -27.21533203125, -26.0068359375, -24.79833984375, -23.58984375, -22.38134765625, -21.1728515625, -19.96435546875, -18.755859375, -17.54736328125, -16.3388671875, -15.13037109375, -13.921875, -12.71337890625, -11.5048828125, -10.29638671875, -9.087890625, -7.87939453125, -6.6708984375, -5.46240234375, -4.25390625, -3.04541015625, -1.8369140625, -0.62841796875, 0.580078125, 1.78857421875, 2.9970703125, 4.20556640625, 5.4140625, 6.62255859375, 7.8310546875, 9.03955078125, 10.248046875, 11.45654296875, 12.6650390625, 13.87353515625, 15.08203125, 16.29052734375, 17.4990234375, 18.70751953125, 19.916015625, 21.12451171875, 22.3330078125, 23.54150390625, 24.75]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 30.0, 87.0, 374.0, 359.0, 85.0, 24.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0005326271057128906, -0.0005186013877391815, -0.0005045756697654724, -0.0004905499517917633, -0.0004765242338180542, -0.0004624985158443451, -0.000448472797870636, -0.0004344470798969269, -0.0004204213619232178, -0.00040639564394950867, -0.00039236992597579956, -0.00037834420800209045, -0.00036431849002838135, -0.00035029277205467224, -0.00033626705408096313, -0.00032224133610725403, -0.0003082156181335449, -0.0002941899001598358, -0.0002801641821861267, -0.0002661384642124176, -0.0002521127462387085, -0.0002380870282649994, -0.00022406131029129028, -0.00021003559231758118, -0.00019600987434387207, -0.00018198415637016296, -0.00016795843839645386, -0.00015393272042274475, -0.00013990700244903564, -0.00012588128447532654, -0.00011185556650161743, -9.782984852790833e-05, -8.380413055419922e-05, -6.977841258049011e-05, -5.5752694606781006e-05, -4.17269766330719e-05, -2.7701258659362793e-05, -1.3675540685653687e-05, 3.501772880554199e-07, 1.4375895261764526e-05, 2.8401613235473633e-05, 4.242733120918274e-05, 5.6453049182891846e-05, 7.047876715660095e-05, 8.450448513031006e-05, 9.853020310401917e-05, 0.00011255592107772827, 0.00012658163905143738, 0.00014060735702514648, 0.0001546330749988556, 0.0001686587929725647, 0.0001826845109462738, 0.0001967102289199829, 0.00021073594689369202, 0.00022476166486740112, 0.00023878738284111023, 0.00025281310081481934, 0.00026683881878852844, 0.00028086453676223755, 0.00029489025473594666, 0.00030891597270965576, 0.00032294169068336487, 0.000336967408657074, 0.0003509931266307831, 0.0003650188446044922]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 18.0, 26.0, 50.0, 79.0, 187.0, 553.0, 3899.0, 160926.0, 871772.0, 9569.0, 969.0, 208.0, 113.0, 41.0, 47.0, 18.0, 15.0, 8.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9140625, -2.8415069580078125, -2.768951416015625, -2.6963958740234375, -2.62384033203125, -2.5512847900390625, -2.478729248046875, -2.4061737060546875, -2.3336181640625, -2.2610626220703125, -2.188507080078125, -2.1159515380859375, -2.04339599609375, -1.9708404541015625, -1.898284912109375, -1.8257293701171875, -1.753173828125, -1.6806182861328125, -1.608062744140625, -1.5355072021484375, -1.46295166015625, -1.3903961181640625, -1.317840576171875, -1.2452850341796875, -1.1727294921875, -1.1001739501953125, -1.027618408203125, -0.9550628662109375, -0.88250732421875, -0.8099517822265625, -0.737396240234375, -0.6648406982421875, -0.59228515625, -0.5197296142578125, -0.447174072265625, -0.3746185302734375, -0.30206298828125, -0.2295074462890625, -0.156951904296875, -0.0843963623046875, -0.0118408203125, 0.0607147216796875, 0.133270263671875, 0.2058258056640625, 0.27838134765625, 0.3509368896484375, 0.423492431640625, 0.4960479736328125, 0.568603515625, 0.6411590576171875, 0.713714599609375, 0.7862701416015625, 0.85882568359375, 0.9313812255859375, 1.003936767578125, 1.0764923095703125, 1.1490478515625, 1.2216033935546875, 1.294158935546875, 1.3667144775390625, 1.43927001953125, 1.5118255615234375, 1.584381103515625, 1.6569366455078125, 1.7294921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 7.0, 14.0, 24.0, 39.0, 52.0, 86.0, 101.0, 165.0, 156.0, 102.0, 71.0, 52.0, 29.0, 28.0, 15.0, 9.0, 7.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4591102600097656, -0.44727325439453125, -0.4354362487792969, -0.4235992431640625, -0.4117622375488281, -0.39992523193359375, -0.3880882263183594, -0.376251220703125, -0.3644142150878906, -0.35257720947265625, -0.3407402038574219, -0.3289031982421875, -0.3170661926269531, -0.30522918701171875, -0.2933921813964844, -0.28155517578125, -0.2697181701660156, -0.25788116455078125, -0.24604415893554688, -0.2342071533203125, -0.22237014770507812, -0.21053314208984375, -0.19869613647460938, -0.186859130859375, -0.17502212524414062, -0.16318511962890625, -0.15134811401367188, -0.1395111083984375, -0.12767410278320312, -0.11583709716796875, -0.10400009155273438, -0.0921630859375, -0.08032608032226562, -0.06848907470703125, -0.056652069091796875, -0.0448150634765625, -0.032978057861328125, -0.02114105224609375, -0.009304046630859375, 0.002532958984375, 0.014369964599609375, 0.02620697021484375, 0.038043975830078125, 0.0498809814453125, 0.061717987060546875, 0.07355499267578125, 0.08539199829101562, 0.09722900390625, 0.10906600952148438, 0.12090301513671875, 0.13274002075195312, 0.1445770263671875, 0.15641403198242188, 0.16825103759765625, 0.18008804321289062, 0.191925048828125, 0.20376205444335938, 0.21559906005859375, 0.22743606567382812, 0.2392730712890625, 0.2511100769042969, 0.26294708251953125, 0.2747840881347656, 0.28662109375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 22.0, 962.0, 37.0], "bins": [-257.7974853515625, -253.67599487304688, -249.5544891357422, -245.43299865722656, -241.31150817871094, -237.19000244140625, -233.06851196289062, -228.947021484375, -224.82553100585938, -220.70404052734375, -216.58253479003906, -212.46104431152344, -208.3395538330078, -204.21804809570312, -200.0965576171875, -195.97506713867188, -191.8535614013672, -187.73207092285156, -183.61056518554688, -179.48907470703125, -175.36758422851562, -171.24609375, -167.1245880126953, -163.0030975341797, -158.881591796875, -154.76010131835938, -150.6385955810547, -146.51710510253906, -142.39561462402344, -138.27410888671875, -134.15261840820312, -130.0311279296875, -125.90962982177734, -121.78813171386719, -117.66664123535156, -113.5451431274414, -109.42364501953125, -105.30215454101562, -101.18065643310547, -97.05915832519531, -92.93766784667969, -88.81616973876953, -84.6946792602539, -80.57318115234375, -76.45169067382812, -72.33019256591797, -68.20869445800781, -64.08720397949219, -59.96570587158203, -55.84421157836914, -51.72271728515625, -47.601219177246094, -43.4797248840332, -39.35823059082031, -35.236732482910156, -31.115238189697266, -26.993743896484375, -22.872249603271484, -18.75075340270996, -14.629258155822754, -10.507762908935547, -6.386268615722656, -2.264772415161133, 1.8567237854003906, 5.978218078613281]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 1.0, 7.0, 9.0, 10.0, 15.0, 11.0, 16.0, 15.0, 24.0, 17.0, 23.0, 28.0, 27.0, 35.0, 36.0, 35.0, 29.0, 32.0, 35.0, 39.0, 41.0, 36.0, 45.0, 44.0, 34.0, 37.0, 33.0, 30.0, 31.0, 30.0, 27.0, 26.0, 26.0, 18.0, 16.0, 9.0, 11.0, 13.0, 5.0, 6.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.181455612182617, -7.926083087921143, -7.670711040496826, -7.415338516235352, -7.159965991973877, -6.904593467712402, -6.649221420288086, -6.393848896026611, -6.138476371765137, -5.883103847503662, -5.627731800079346, -5.372359275817871, -5.1169867515563965, -4.861614227294922, -4.6062421798706055, -4.350869655609131, -4.0954976081848145, -3.840125322341919, -3.5847527980804443, -3.329380512237549, -3.074007987976074, -2.8186357021331787, -2.563263416290283, -2.3078908920288086, -2.052518606185913, -1.797146201133728, -1.541773796081543, -1.2864015102386475, -1.0310291051864624, -0.7756567001342773, -0.5202844142913818, -0.2649120092391968, -0.009539604187011719, 0.24583277106285095, 0.5012051463127136, 0.7565774917602539, 1.011949896812439, 1.267322301864624, 1.5226945877075195, 1.7780669927597046, 2.0334393978118896, 2.288811683654785, 2.5441842079162598, 2.7995564937591553, 3.054928779602051, 3.3103013038635254, 3.565673589706421, 3.8210458755493164, 4.076418399810791, 4.331790924072266, 4.587162971496582, 4.842535495758057, 5.097908020019531, 5.353280067443848, 5.608652591705322, 5.864025115966797, 6.119397163391113, 6.374769687652588, 6.630141735076904, 6.885514259338379, 7.1408867835998535, 7.396259307861328, 7.6516313552856445, 7.907003879547119, 8.162376403808594]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 9.0, 5.0, 4.0, 10.0, 12.0, 14.0, 20.0, 23.0, 24.0, 25.0, 44.0, 78.0, 91.0, 135.0, 188.0, 333.0, 628.0, 1301.0, 3654.0, 11888.0, 58063.0, 401291.0, 1981412.0, 1450947.0, 233486.0, 36864.0, 8664.0, 2704.0, 1098.0, 486.0, 293.0, 178.0, 88.0, 60.0, 39.0, 23.0, 26.0, 12.0, 16.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0], "bins": [-5.0, -4.84783935546875, -4.6956787109375, -4.54351806640625, -4.391357421875, -4.23919677734375, -4.0870361328125, -3.93487548828125, -3.78271484375, -3.63055419921875, -3.4783935546875, -3.32623291015625, -3.174072265625, -3.02191162109375, -2.8697509765625, -2.71759033203125, -2.5654296875, -2.41326904296875, -2.2611083984375, -2.10894775390625, -1.956787109375, -1.80462646484375, -1.6524658203125, -1.50030517578125, -1.34814453125, -1.19598388671875, -1.0438232421875, -0.89166259765625, -0.739501953125, -0.58734130859375, -0.4351806640625, -0.28302001953125, -0.130859375, 0.02130126953125, 0.1734619140625, 0.32562255859375, 0.477783203125, 0.62994384765625, 0.7821044921875, 0.93426513671875, 1.08642578125, 1.23858642578125, 1.3907470703125, 1.54290771484375, 1.695068359375, 1.84722900390625, 1.9993896484375, 2.15155029296875, 2.3037109375, 2.45587158203125, 2.6080322265625, 2.76019287109375, 2.912353515625, 3.06451416015625, 3.2166748046875, 3.36883544921875, 3.52099609375, 3.67315673828125, 3.8253173828125, 3.97747802734375, 4.129638671875, 4.28179931640625, 4.4339599609375, 4.58612060546875, 4.73828125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 9.0, 11.0, 11.0, 9.0, 8.0, 23.0, 25.0, 23.0, 24.0, 43.0, 38.0, 48.0, 43.0, 51.0, 61.0, 56.0, 50.0, 64.0, 60.0, 36.0, 54.0, 48.0, 31.0, 26.0, 30.0, 24.0, 26.0, 14.0, 11.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.4078369140625, -3.302001953125, -3.1961669921875, -3.09033203125, -2.9844970703125, -2.878662109375, -2.7728271484375, -2.6669921875, -2.5611572265625, -2.455322265625, -2.3494873046875, -2.24365234375, -2.1378173828125, -2.031982421875, -1.9261474609375, -1.8203125, -1.7144775390625, -1.608642578125, -1.5028076171875, -1.39697265625, -1.2911376953125, -1.185302734375, -1.0794677734375, -0.9736328125, -0.8677978515625, -0.761962890625, -0.6561279296875, -0.55029296875, -0.4444580078125, -0.338623046875, -0.2327880859375, -0.126953125, -0.0211181640625, 0.084716796875, 0.1905517578125, 0.29638671875, 0.4022216796875, 0.508056640625, 0.6138916015625, 0.7197265625, 0.8255615234375, 0.931396484375, 1.0372314453125, 1.14306640625, 1.2489013671875, 1.354736328125, 1.4605712890625, 1.56640625, 1.6722412109375, 1.778076171875, 1.8839111328125, 1.98974609375, 2.0955810546875, 2.201416015625, 2.3072509765625, 2.4130859375, 2.5189208984375, 2.624755859375, 2.7305908203125, 2.83642578125, 2.9422607421875, 3.048095703125, 3.1539306640625, 3.259765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 11.0, 13.0, 47.0, 130.0, 856.0, 4088763.0, 103864.0, 438.0, 85.0, 31.0, 13.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -15.166015625, -13.76953125, -12.373046875, -10.9765625, -9.580078125, -8.18359375, -6.787109375, -5.390625, -3.994140625, -2.59765625, -1.201171875, 0.1953125, 1.591796875, 2.98828125, 4.384765625, 5.78125, 7.177734375, 8.57421875, 9.970703125, 11.3671875, 12.763671875, 14.16015625, 15.556640625, 16.953125, 18.349609375, 19.74609375, 21.142578125, 22.5390625, 23.935546875, 25.33203125, 26.728515625, 28.125, 29.521484375, 30.91796875, 32.314453125, 33.7109375, 35.107421875, 36.50390625, 37.900390625, 39.296875, 40.693359375, 42.08984375, 43.486328125, 44.8828125, 46.279296875, 47.67578125, 49.072265625, 50.46875, 51.865234375, 53.26171875, 54.658203125, 56.0546875, 57.451171875, 58.84765625, 60.244140625, 61.640625, 63.037109375, 64.43359375, 65.830078125, 67.2265625, 68.623046875, 70.01953125, 71.416015625, 72.8125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 13.0, 15.0, 22.0, 29.0, 51.0, 45.0, 94.0, 138.0, 175.0, 271.0, 368.0, 535.0, 541.0, 508.0, 404.0, 250.0, 171.0, 119.0, 73.0, 59.0, 42.0, 26.0, 23.0, 21.0, 9.0, 10.0, 7.0, 3.0, 3.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5595703125, -1.5128326416015625, -1.466094970703125, -1.4193572998046875, -1.37261962890625, -1.3258819580078125, -1.279144287109375, -1.2324066162109375, -1.1856689453125, -1.1389312744140625, -1.092193603515625, -1.0454559326171875, -0.99871826171875, -0.9519805908203125, -0.905242919921875, -0.8585052490234375, -0.811767578125, -0.7650299072265625, -0.718292236328125, -0.6715545654296875, -0.62481689453125, -0.5780792236328125, -0.531341552734375, -0.4846038818359375, -0.4378662109375, -0.3911285400390625, -0.344390869140625, -0.2976531982421875, -0.25091552734375, -0.2041778564453125, -0.157440185546875, -0.1107025146484375, -0.06396484375, -0.0172271728515625, 0.029510498046875, 0.0762481689453125, 0.12298583984375, 0.1697235107421875, 0.216461181640625, 0.2631988525390625, 0.3099365234375, 0.3566741943359375, 0.403411865234375, 0.4501495361328125, 0.49688720703125, 0.5436248779296875, 0.590362548828125, 0.6371002197265625, 0.683837890625, 0.7305755615234375, 0.777313232421875, 0.8240509033203125, 0.87078857421875, 0.9175262451171875, 0.964263916015625, 1.0110015869140625, 1.0577392578125, 1.1044769287109375, 1.151214599609375, 1.1979522705078125, 1.24468994140625, 1.2914276123046875, 1.338165283203125, 1.3849029541015625, 1.431640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 29.0, 47.0, 114.0, 208.0, 266.0, 164.0, 103.0, 47.0, 17.0, 5.0, 2.0, 2.0], "bins": [-23.95665740966797, -23.531173706054688, -23.105688095092773, -22.680204391479492, -22.254718780517578, -21.829235076904297, -21.403751373291016, -20.9782657623291, -20.55278205871582, -20.12729835510254, -19.701812744140625, -19.276329040527344, -18.85084342956543, -18.42535972595215, -17.999874114990234, -17.574390411376953, -17.14890480041504, -16.723421096801758, -16.297935485839844, -15.872451782226562, -15.446967124938965, -15.021482467651367, -14.59599781036377, -14.170513153076172, -13.74502944946289, -13.319544792175293, -12.894060134887695, -12.468576431274414, -12.043091773986816, -11.617607116699219, -11.192122459411621, -10.766637802124023, -10.341154098510742, -9.915669441223145, -9.490184783935547, -9.064701080322266, -8.639216423034668, -8.21373176574707, -7.788247108459473, -7.362762451171875, -6.937277793884277, -6.51179313659668, -6.08630895614624, -5.660824298858643, -5.235339641571045, -4.8098554611206055, -4.384370803833008, -3.95888614654541, -3.5334014892578125, -3.107917070388794, -2.6824324131011963, -2.2569479942321777, -1.8314634561538696, -1.4059789180755615, -0.980494499206543, -0.5550098419189453, -0.12952542304992676, 0.29595908522605896, 0.7214435935020447, 1.146928071975708, 1.5724126100540161, 1.9978971481323242, 2.4233815670013428, 2.8488662242889404, 3.274350643157959]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 12.0, 11.0, 13.0, 10.0, 19.0, 22.0, 23.0, 29.0, 29.0, 35.0, 29.0, 31.0, 34.0, 38.0, 37.0, 53.0, 45.0, 36.0, 48.0, 45.0, 35.0, 39.0, 43.0, 41.0, 26.0, 33.0, 25.0, 38.0, 24.0, 22.0, 17.0, 16.0, 11.0, 9.0, 4.0, 8.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.8913259506225586, -3.787609100341797, -3.683892011642456, -3.5801749229431152, -3.4764580726623535, -3.372741222381592, -3.269024133682251, -3.16530704498291, -3.0615901947021484, -2.9578733444213867, -2.854156255722046, -2.750439167022705, -2.6467223167419434, -2.5430054664611816, -2.439288377761841, -2.3355712890625, -2.2318544387817383, -2.1281375885009766, -2.0244204998016357, -1.9207035303115845, -1.8169865608215332, -1.713269591331482, -1.6095526218414307, -1.5058356523513794, -1.4021186828613281, -1.2984017133712769, -1.1946847438812256, -1.0909677743911743, -0.987250804901123, -0.8835338354110718, -0.7798168659210205, -0.6760998964309692, -0.5723831653594971, -0.4686661958694458, -0.36494922637939453, -0.26123225688934326, -0.157515287399292, -0.05379831790924072, 0.04991865158081055, 0.15363562107086182, 0.2573525905609131, 0.36106956005096436, 0.4647865295410156, 0.5685034990310669, 0.6722204685211182, 0.7759374380111694, 0.8796544075012207, 0.983371376991272, 1.0870883464813232, 1.1908053159713745, 1.2945222854614258, 1.398239254951477, 1.5019562244415283, 1.6056731939315796, 1.7093901634216309, 1.8131071329116821, 1.9168241024017334, 2.020541191101074, 2.124258041381836, 2.2279748916625977, 2.3316919803619385, 2.4354090690612793, 2.539125919342041, 2.6428427696228027, 2.7465598583221436]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 2.0, 4.0, 12.0, 14.0, 25.0, 44.0, 59.0, 101.0, 161.0, 240.0, 352.0, 594.0, 902.0, 1493.0, 3124.0, 7498.0, 21355.0, 71775.0, 234250.0, 401246.0, 209934.0, 62625.0, 19195.0, 6772.0, 2895.0, 1510.0, 882.0, 537.0, 327.0, 231.0, 145.0, 82.0, 45.0, 34.0, 27.0, 17.0, 7.0, 10.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8017578125, -0.7735748291015625, -0.745391845703125, -0.7172088623046875, -0.68902587890625, -0.6608428955078125, -0.632659912109375, -0.6044769287109375, -0.5762939453125, -0.5481109619140625, -0.519927978515625, -0.4917449951171875, -0.46356201171875, -0.4353790283203125, -0.407196044921875, -0.3790130615234375, -0.350830078125, -0.3226470947265625, -0.294464111328125, -0.2662811279296875, -0.23809814453125, -0.2099151611328125, -0.181732177734375, -0.1535491943359375, -0.1253662109375, -0.0971832275390625, -0.069000244140625, -0.0408172607421875, -0.01263427734375, 0.0155487060546875, 0.043731689453125, 0.0719146728515625, 0.10009765625, 0.1282806396484375, 0.156463623046875, 0.1846466064453125, 0.21282958984375, 0.2410125732421875, 0.269195556640625, 0.2973785400390625, 0.3255615234375, 0.3537445068359375, 0.381927490234375, 0.4101104736328125, 0.43829345703125, 0.4664764404296875, 0.494659423828125, 0.5228424072265625, 0.551025390625, 0.5792083740234375, 0.607391357421875, 0.6355743408203125, 0.66375732421875, 0.6919403076171875, 0.720123291015625, 0.7483062744140625, 0.7764892578125, 0.8046722412109375, 0.832855224609375, 0.8610382080078125, 0.88922119140625, 0.9174041748046875, 0.945587158203125, 0.9737701416015625, 1.001953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 11.0, 9.0, 14.0, 21.0, 23.0, 18.0, 27.0, 14.0, 39.0, 46.0, 44.0, 35.0, 46.0, 58.0, 50.0, 55.0, 43.0, 34.0, 51.0, 39.0, 49.0, 49.0, 47.0, 34.0, 26.0, 27.0, 20.0, 22.0, 13.0, 15.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4453125, -3.354278564453125, -3.26324462890625, -3.172210693359375, -3.0811767578125, -2.990142822265625, -2.89910888671875, -2.808074951171875, -2.717041015625, -2.626007080078125, -2.53497314453125, -2.443939208984375, -2.3529052734375, -2.261871337890625, -2.17083740234375, -2.079803466796875, -1.98876953125, -1.897735595703125, -1.80670166015625, -1.715667724609375, -1.6246337890625, -1.533599853515625, -1.44256591796875, -1.351531982421875, -1.260498046875, -1.169464111328125, -1.07843017578125, -0.987396240234375, -0.8963623046875, -0.805328369140625, -0.71429443359375, -0.623260498046875, -0.5322265625, -0.441192626953125, -0.35015869140625, -0.259124755859375, -0.1680908203125, -0.077056884765625, 0.01397705078125, 0.105010986328125, 0.196044921875, 0.287078857421875, 0.37811279296875, 0.469146728515625, 0.5601806640625, 0.651214599609375, 0.74224853515625, 0.833282470703125, 0.92431640625, 1.015350341796875, 1.10638427734375, 1.197418212890625, 1.2884521484375, 1.379486083984375, 1.47052001953125, 1.561553955078125, 1.652587890625, 1.743621826171875, 1.83465576171875, 1.925689697265625, 2.0167236328125, 2.107757568359375, 2.19879150390625, 2.289825439453125, 2.380859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 12.0, 10.0, 13.0, 17.0, 32.0, 43.0, 49.0, 100.0, 149.0, 234.0, 311.0, 494.0, 776.0, 1235.0, 1977.0, 2971.0, 4955.0, 7897.0, 13002.0, 21132.0, 34311.0, 55827.0, 85476.0, 121940.0, 152894.0, 157373.0, 130364.0, 92786.0, 61833.0, 38348.0, 23740.0, 14352.0, 9006.0, 5482.0, 3401.0, 2095.0, 1391.0, 901.0, 567.0, 367.0, 235.0, 144.0, 96.0, 64.0, 48.0, 31.0, 27.0, 15.0, 8.0, 5.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.228759765625, -0.22062301635742188, -0.21248626708984375, -0.20434951782226562, -0.1962127685546875, -0.18807601928710938, -0.17993927001953125, -0.17180252075195312, -0.163665771484375, -0.15552902221679688, -0.14739227294921875, -0.13925552368164062, -0.1311187744140625, -0.12298202514648438, -0.11484527587890625, -0.10670852661132812, -0.09857177734375, -0.09043502807617188, -0.08229827880859375, -0.07416152954101562, -0.0660247802734375, -0.057888031005859375, -0.04975128173828125, -0.041614532470703125, -0.033477783203125, -0.025341033935546875, -0.01720428466796875, -0.009067535400390625, -0.0009307861328125, 0.007205963134765625, 0.01534271240234375, 0.023479461669921875, 0.0316162109375, 0.039752960205078125, 0.04788970947265625, 0.056026458740234375, 0.0641632080078125, 0.07229995727539062, 0.08043670654296875, 0.08857345581054688, 0.096710205078125, 0.10484695434570312, 0.11298370361328125, 0.12112045288085938, 0.1292572021484375, 0.13739395141601562, 0.14553070068359375, 0.15366744995117188, 0.16180419921875, 0.16994094848632812, 0.17807769775390625, 0.18621444702148438, 0.1943511962890625, 0.20248794555664062, 0.21062469482421875, 0.21876144409179688, 0.226898193359375, 0.23503494262695312, 0.24317169189453125, 0.2513084411621094, 0.2594451904296875, 0.2675819396972656, 0.27571868896484375, 0.2838554382324219, 0.2919921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 5.0, 3.0, 7.0, 10.0, 10.0, 9.0, 14.0, 11.0, 22.0, 24.0, 28.0, 34.0, 38.0, 46.0, 30.0, 41.0, 38.0, 39.0, 37.0, 33.0, 39.0, 46.0, 31.0, 39.0, 38.0, 38.0, 31.0, 36.0, 27.0, 36.0, 20.0, 18.0, 19.0, 20.0, 12.0, 13.0, 13.0, 9.0, 5.0, 7.0, 8.0, 3.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.1759033203125, -4.039306640625, -3.9027099609375, -3.76611328125, -3.6295166015625, -3.492919921875, -3.3563232421875, -3.2197265625, -3.0831298828125, -2.946533203125, -2.8099365234375, -2.67333984375, -2.5367431640625, -2.400146484375, -2.2635498046875, -2.126953125, -1.9903564453125, -1.853759765625, -1.7171630859375, -1.58056640625, -1.4439697265625, -1.307373046875, -1.1707763671875, -1.0341796875, -0.8975830078125, -0.760986328125, -0.6243896484375, -0.48779296875, -0.3511962890625, -0.214599609375, -0.0780029296875, 0.05859375, 0.1951904296875, 0.331787109375, 0.4683837890625, 0.60498046875, 0.7415771484375, 0.878173828125, 1.0147705078125, 1.1513671875, 1.2879638671875, 1.424560546875, 1.5611572265625, 1.69775390625, 1.8343505859375, 1.970947265625, 2.1075439453125, 2.244140625, 2.3807373046875, 2.517333984375, 2.6539306640625, 2.79052734375, 2.9271240234375, 3.063720703125, 3.2003173828125, 3.3369140625, 3.4735107421875, 3.610107421875, 3.7467041015625, 3.88330078125, 4.0198974609375, 4.156494140625, 4.2930908203125, 4.4296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 9.0, 8.0, 16.0, 18.0, 22.0, 28.0, 45.0, 77.0, 136.0, 194.0, 341.0, 694.0, 1530.0, 4026.0, 13241.0, 67639.0, 420819.0, 444546.0, 73665.0, 14122.0, 4087.0, 1585.0, 734.0, 359.0, 211.0, 109.0, 80.0, 62.0, 31.0, 23.0, 22.0, 13.0, 10.0, 19.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09649658203125, -0.09305286407470703, -0.08960914611816406, -0.0861654281616211, -0.08272171020507812, -0.07927799224853516, -0.07583427429199219, -0.07239055633544922, -0.06894683837890625, -0.06550312042236328, -0.06205940246582031, -0.058615684509277344, -0.055171966552734375, -0.051728248596191406, -0.04828453063964844, -0.04484081268310547, -0.0413970947265625, -0.03795337677001953, -0.03450965881347656, -0.031065940856933594, -0.027622222900390625, -0.024178504943847656, -0.020734786987304688, -0.01729106903076172, -0.01384735107421875, -0.010403633117675781, -0.0069599151611328125, -0.0035161972045898438, -7.2479248046875e-05, 0.0033712387084960938, 0.0068149566650390625, 0.010258674621582031, 0.013702392578125, 0.01714611053466797, 0.020589828491210938, 0.024033546447753906, 0.027477264404296875, 0.030920982360839844, 0.03436470031738281, 0.03780841827392578, 0.04125213623046875, 0.04469585418701172, 0.04813957214355469, 0.051583290100097656, 0.055027008056640625, 0.058470726013183594, 0.06191444396972656, 0.06535816192626953, 0.0688018798828125, 0.07224559783935547, 0.07568931579589844, 0.0791330337524414, 0.08257675170898438, 0.08602046966552734, 0.08946418762207031, 0.09290790557861328, 0.09635162353515625, 0.09979534149169922, 0.10323905944824219, 0.10668277740478516, 0.11012649536132812, 0.1135702133178711, 0.11701393127441406, 0.12045764923095703, 0.1239013671875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 12.0, 15.0, 26.0, 30.0, 51.0, 81.0, 120.0, 120.0, 137.0, 110.0, 79.0, 89.0, 36.0, 26.0, 26.0, 12.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010401010513305664, -0.0001013539731502533, -9.869784116744995e-05, -9.60417091846466e-05, -9.338557720184326e-05, -9.072944521903992e-05, -8.807331323623657e-05, -8.541718125343323e-05, -8.276104927062988e-05, -8.010491728782654e-05, -7.74487853050232e-05, -7.479265332221985e-05, -7.21365213394165e-05, -6.948038935661316e-05, -6.682425737380981e-05, -6.416812539100647e-05, -6.151199340820312e-05, -5.885586142539978e-05, -5.6199729442596436e-05, -5.354359745979309e-05, -5.0887465476989746e-05, -4.82313334941864e-05, -4.557520151138306e-05, -4.291906952857971e-05, -4.026293754577637e-05, -3.760680556297302e-05, -3.495067358016968e-05, -3.229454159736633e-05, -2.9638409614562988e-05, -2.6982277631759644e-05, -2.43261456489563e-05, -2.1670013666152954e-05, -1.901388168334961e-05, -1.6357749700546265e-05, -1.370161771774292e-05, -1.1045485734939575e-05, -8.38935375213623e-06, -5.733221769332886e-06, -3.077089786529541e-06, -4.209578037261963e-07, 2.2351741790771484e-06, 4.891306161880493e-06, 7.547438144683838e-06, 1.0203570127487183e-05, 1.2859702110290527e-05, 1.5515834093093872e-05, 1.8171966075897217e-05, 2.082809805870056e-05, 2.3484230041503906e-05, 2.614036202430725e-05, 2.8796494007110596e-05, 3.145262598991394e-05, 3.4108757972717285e-05, 3.676488995552063e-05, 3.9421021938323975e-05, 4.207715392112732e-05, 4.4733285903930664e-05, 4.738941788673401e-05, 5.0045549869537354e-05, 5.27016818523407e-05, 5.535781383514404e-05, 5.801394581794739e-05, 6.067007780075073e-05, 6.332620978355408e-05, 6.598234176635742e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 4.0, 18.0, 4.0, 7.0, 15.0, 37.0, 95.0, 306.0, 1336.0, 25212.0, 995064.0, 24425.0, 1493.0, 309.0, 100.0, 39.0, 21.0, 12.0, 18.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.337890625, -0.32350921630859375, -0.3091278076171875, -0.29474639892578125, -0.280364990234375, -0.26598358154296875, -0.2516021728515625, -0.23722076416015625, -0.22283935546875, -0.20845794677734375, -0.1940765380859375, -0.17969512939453125, -0.165313720703125, -0.15093231201171875, -0.1365509033203125, -0.12216949462890625, -0.1077880859375, -0.09340667724609375, -0.0790252685546875, -0.06464385986328125, -0.050262451171875, -0.03588104248046875, -0.0214996337890625, -0.00711822509765625, 0.00726318359375, 0.02164459228515625, 0.0360260009765625, 0.05040740966796875, 0.064788818359375, 0.07917022705078125, 0.0935516357421875, 0.10793304443359375, 0.122314453125, 0.13669586181640625, 0.1510772705078125, 0.16545867919921875, 0.179840087890625, 0.19422149658203125, 0.2086029052734375, 0.22298431396484375, 0.23736572265625, 0.25174713134765625, 0.2661285400390625, 0.28050994873046875, 0.294891357421875, 0.30927276611328125, 0.3236541748046875, 0.33803558349609375, 0.3524169921875, 0.36679840087890625, 0.3811798095703125, 0.39556121826171875, 0.409942626953125, 0.42432403564453125, 0.4387054443359375, 0.45308685302734375, 0.46746826171875, 0.48184967041015625, 0.4962310791015625, 0.5106124877929688, 0.524993896484375, 0.5393753051757812, 0.5537567138671875, 0.5681381225585938, 0.58251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 9.0, 10.0, 24.0, 46.0, 67.0, 104.0, 162.0, 179.0, 130.0, 95.0, 65.0, 49.0, 15.0, 10.0, 6.0, 5.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.07419109344482422, -0.07202720642089844, -0.06986331939697266, -0.06769943237304688, -0.0655355453491211, -0.06337165832519531, -0.06120777130126953, -0.05904388427734375, -0.05687999725341797, -0.05471611022949219, -0.052552223205566406, -0.050388336181640625, -0.048224449157714844, -0.04606056213378906, -0.04389667510986328, -0.0417327880859375, -0.03956890106201172, -0.03740501403808594, -0.035241127014160156, -0.033077239990234375, -0.030913352966308594, -0.028749465942382812, -0.02658557891845703, -0.02442169189453125, -0.02225780487060547, -0.020093917846679688, -0.017930030822753906, -0.015766143798828125, -0.013602256774902344, -0.011438369750976562, -0.009274482727050781, -0.007110595703125, -0.004946708679199219, -0.0027828216552734375, -0.0006189346313476562, 0.001544952392578125, 0.0037088394165039062, 0.0058727264404296875, 0.008036613464355469, 0.01020050048828125, 0.012364387512207031, 0.014528274536132812, 0.016692161560058594, 0.018856048583984375, 0.021019935607910156, 0.023183822631835938, 0.02534770965576172, 0.0275115966796875, 0.02967548370361328, 0.03183937072753906, 0.034003257751464844, 0.036167144775390625, 0.038331031799316406, 0.04049491882324219, 0.04265880584716797, 0.04482269287109375, 0.04698657989501953, 0.04915046691894531, 0.051314353942871094, 0.053478240966796875, 0.055642127990722656, 0.05780601501464844, 0.05996990203857422, 0.0621337890625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 16.0, 54.0, 124.0, 326.0, 280.0, 146.0, 48.0, 11.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.771463394165039, -15.40365982055664, -15.035855293273926, -14.668051719665527, -14.300247192382812, -13.932443618774414, -13.564640045166016, -13.1968355178833, -12.829030990600586, -12.461227416992188, -12.093422889709473, -11.725619316101074, -11.35781478881836, -10.990011215209961, -10.622207641601562, -10.254403114318848, -9.88659954071045, -9.51879596710205, -9.150991439819336, -8.783187866210938, -8.415383338928223, -8.047579765319824, -7.679775714874268, -7.311971664428711, -6.944167613983154, -6.576363563537598, -6.208559513092041, -5.840755462646484, -5.472951889038086, -5.105147361755371, -4.737343788146973, -4.369539737701416, -4.001734733581543, -3.6339306831359863, -3.2661266326904297, -2.898322820663452, -2.5305187702178955, -2.162714719772339, -1.7949109077453613, -1.4271068572998047, -1.059302806854248, -0.6914988160133362, -0.3236948251724243, 0.04410910606384277, 0.4119131565093994, 0.779717206954956, 1.1475210189819336, 1.5153250694274902, 1.8831291198730469, 2.2509331703186035, 2.61873722076416, 2.9865410327911377, 3.3543450832366943, 3.722149133682251, 4.0899529457092285, 4.457756996154785, 4.825561046600342, 5.193365097045898, 5.561169147491455, 5.928973197937012, 6.29677677154541, 6.664581298828125, 7.032384872436523, 7.40018892288208, 7.767992973327637]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 8.0, 9.0, 11.0, 19.0, 24.0, 33.0, 27.0, 26.0, 45.0, 29.0, 55.0, 42.0, 42.0, 56.0, 61.0, 51.0, 42.0, 46.0, 50.0, 50.0, 41.0, 28.0, 57.0, 30.0, 23.0, 24.0, 15.0, 17.0, 9.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2903947830200195, -3.199469566345215, -3.1085445880889893, -3.0176193714141846, -2.92669415473938, -2.8357691764831543, -2.7448439598083496, -2.653918743133545, -2.5629937648773193, -2.4720685482025146, -2.381143569946289, -2.2902183532714844, -2.1992931365966797, -2.108368158340454, -2.0174429416656494, -1.9265178442001343, -1.8355926275253296, -1.7446675300598145, -1.6537423133850098, -1.5628172159194946, -1.4718921184539795, -1.3809669017791748, -1.2900418043136597, -1.1991167068481445, -1.1081914901733398, -1.0172663927078247, -0.9263412356376648, -0.8354160785675049, -0.7444909811019897, -0.6535658240318298, -0.5626406669616699, -0.4717155694961548, -0.38079047203063965, -0.2898653447628021, -0.1989402025938034, -0.10801506042480469, -0.017089933156967163, 0.07383519411087036, 0.16476035118103027, 0.2556854486465454, 0.3466106057167053, 0.43753573298454285, 0.5284608602523804, 0.6193860173225403, 0.7103111743927002, 0.8012362718582153, 0.8921614289283752, 0.9830865263938904, 1.0740116834640503, 1.1649367809295654, 1.2558619976043701, 1.3467870950698853, 1.4377121925354004, 1.528637409210205, 1.6195625066757202, 1.7104876041412354, 1.80141282081604, 1.8923379182815552, 1.9832631349563599, 2.074188232421875, 2.1651134490966797, 2.2560384273529053, 2.34696364402771, 2.4378886222839355, 2.5288138389587402]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 18.0, 26.0, 31.0, 41.0, 59.0, 83.0, 136.0, 200.0, 284.0, 496.0, 869.0, 1626.0, 3197.0, 7241.0, 19381.0, 61379.0, 216335.0, 447963.0, 200713.0, 56645.0, 18155.0, 6884.0, 3034.0, 1521.0, 791.0, 500.0, 315.0, 174.0, 135.0, 68.0, 62.0, 50.0, 25.0, 31.0, 12.0, 18.0, 12.0, 6.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.742034912109375, -2.65203857421875, -2.562042236328125, -2.4720458984375, -2.382049560546875, -2.29205322265625, -2.202056884765625, -2.112060546875, -2.022064208984375, -1.93206787109375, -1.842071533203125, -1.7520751953125, -1.662078857421875, -1.57208251953125, -1.482086181640625, -1.39208984375, -1.302093505859375, -1.21209716796875, -1.122100830078125, -1.0321044921875, -0.942108154296875, -0.85211181640625, -0.762115478515625, -0.672119140625, -0.582122802734375, -0.49212646484375, -0.402130126953125, -0.3121337890625, -0.222137451171875, -0.13214111328125, -0.042144775390625, 0.0478515625, 0.137847900390625, 0.22784423828125, 0.317840576171875, 0.4078369140625, 0.497833251953125, 0.58782958984375, 0.677825927734375, 0.767822265625, 0.857818603515625, 0.94781494140625, 1.037811279296875, 1.1278076171875, 1.217803955078125, 1.30780029296875, 1.397796630859375, 1.48779296875, 1.577789306640625, 1.66778564453125, 1.757781982421875, 1.8477783203125, 1.937774658203125, 2.02777099609375, 2.117767333984375, 2.207763671875, 2.297760009765625, 2.38775634765625, 2.477752685546875, 2.5677490234375, 2.657745361328125, 2.74774169921875, 2.837738037109375, 2.927734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 18.0, 8.0, 16.0, 26.0, 19.0, 28.0, 21.0, 26.0, 21.0, 43.0, 34.0, 34.0, 43.0, 39.0, 33.0, 42.0, 38.0, 46.0, 55.0, 39.0, 35.0, 37.0, 26.0, 28.0, 33.0, 19.0, 30.0, 18.0, 24.0, 17.0, 14.0, 16.0, 13.0, 6.0, 10.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.21875, -4.097930908203125, -3.97711181640625, -3.856292724609375, -3.7354736328125, -3.614654541015625, -3.49383544921875, -3.373016357421875, -3.252197265625, -3.131378173828125, -3.01055908203125, -2.889739990234375, -2.7689208984375, -2.648101806640625, -2.52728271484375, -2.406463623046875, -2.28564453125, -2.164825439453125, -2.04400634765625, -1.923187255859375, -1.8023681640625, -1.681549072265625, -1.56072998046875, -1.439910888671875, -1.319091796875, -1.198272705078125, -1.07745361328125, -0.956634521484375, -0.8358154296875, -0.714996337890625, -0.59417724609375, -0.473358154296875, -0.3525390625, -0.231719970703125, -0.11090087890625, 0.009918212890625, 0.1307373046875, 0.251556396484375, 0.37237548828125, 0.493194580078125, 0.614013671875, 0.734832763671875, 0.85565185546875, 0.976470947265625, 1.0972900390625, 1.218109130859375, 1.33892822265625, 1.459747314453125, 1.58056640625, 1.701385498046875, 1.82220458984375, 1.943023681640625, 2.0638427734375, 2.184661865234375, 2.30548095703125, 2.426300048828125, 2.547119140625, 2.667938232421875, 2.78875732421875, 2.909576416015625, 3.0303955078125, 3.151214599609375, 3.27203369140625, 3.392852783203125, 3.513671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 6.0, 9.0, 6.0, 15.0, 18.0, 20.0, 31.0, 33.0, 51.0, 75.0, 112.0, 159.0, 232.0, 793.0, 42468.0, 997982.0, 5408.0, 444.0, 212.0, 135.0, 86.0, 72.0, 49.0, 37.0, 22.0, 24.0, 13.0, 7.0, 4.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.875, -20.28369140625, -19.6923828125, -19.10107421875, -18.509765625, -17.91845703125, -17.3271484375, -16.73583984375, -16.14453125, -15.55322265625, -14.9619140625, -14.37060546875, -13.779296875, -13.18798828125, -12.5966796875, -12.00537109375, -11.4140625, -10.82275390625, -10.2314453125, -9.64013671875, -9.048828125, -8.45751953125, -7.8662109375, -7.27490234375, -6.68359375, -6.09228515625, -5.5009765625, -4.90966796875, -4.318359375, -3.72705078125, -3.1357421875, -2.54443359375, -1.953125, -1.36181640625, -0.7705078125, -0.17919921875, 0.412109375, 1.00341796875, 1.5947265625, 2.18603515625, 2.77734375, 3.36865234375, 3.9599609375, 4.55126953125, 5.142578125, 5.73388671875, 6.3251953125, 6.91650390625, 7.5078125, 8.09912109375, 8.6904296875, 9.28173828125, 9.873046875, 10.46435546875, 11.0556640625, 11.64697265625, 12.23828125, 12.82958984375, 13.4208984375, 14.01220703125, 14.603515625, 15.19482421875, 15.7861328125, 16.37744140625, 16.96875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 12.0, 7.0, 10.0, 11.0, 19.0, 35.0, 35.0, 45.0, 57.0, 60.0, 51.0, 43.0, 60.0, 71.0, 67.0, 62.0, 62.0, 51.0, 39.0, 29.0, 37.0, 32.0, 26.0, 15.0, 12.0, 16.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.96484375, -7.759033203125, -7.55322265625, -7.347412109375, -7.1416015625, -6.935791015625, -6.72998046875, -6.524169921875, -6.318359375, -6.112548828125, -5.90673828125, -5.700927734375, -5.4951171875, -5.289306640625, -5.08349609375, -4.877685546875, -4.671875, -4.466064453125, -4.26025390625, -4.054443359375, -3.8486328125, -3.642822265625, -3.43701171875, -3.231201171875, -3.025390625, -2.819580078125, -2.61376953125, -2.407958984375, -2.2021484375, -1.996337890625, -1.79052734375, -1.584716796875, -1.37890625, -1.173095703125, -0.96728515625, -0.761474609375, -0.5556640625, -0.349853515625, -0.14404296875, 0.061767578125, 0.267578125, 0.473388671875, 0.67919921875, 0.885009765625, 1.0908203125, 1.296630859375, 1.50244140625, 1.708251953125, 1.9140625, 2.119873046875, 2.32568359375, 2.531494140625, 2.7373046875, 2.943115234375, 3.14892578125, 3.354736328125, 3.560546875, 3.766357421875, 3.97216796875, 4.177978515625, 4.3837890625, 4.589599609375, 4.79541015625, 5.001220703125, 5.20703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 11.0, 12.0, 18.0, 36.0, 51.0, 133.0, 564.0, 9372.0, 1022612.0, 14689.0, 728.0, 145.0, 63.0, 43.0, 23.0, 15.0, 10.0, 10.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.60137939453125, -5.3980712890625, -5.19476318359375, -4.991455078125, -4.78814697265625, -4.5848388671875, -4.38153076171875, -4.17822265625, -3.97491455078125, -3.7716064453125, -3.56829833984375, -3.364990234375, -3.16168212890625, -2.9583740234375, -2.75506591796875, -2.5517578125, -2.34844970703125, -2.1451416015625, -1.94183349609375, -1.738525390625, -1.53521728515625, -1.3319091796875, -1.12860107421875, -0.92529296875, -0.72198486328125, -0.5186767578125, -0.31536865234375, -0.112060546875, 0.09124755859375, 0.2945556640625, 0.49786376953125, 0.701171875, 0.90447998046875, 1.1077880859375, 1.31109619140625, 1.514404296875, 1.71771240234375, 1.9210205078125, 2.12432861328125, 2.32763671875, 2.53094482421875, 2.7342529296875, 2.93756103515625, 3.140869140625, 3.34417724609375, 3.5474853515625, 3.75079345703125, 3.9541015625, 4.15740966796875, 4.3607177734375, 4.56402587890625, 4.767333984375, 4.97064208984375, 5.1739501953125, 5.37725830078125, 5.58056640625, 5.78387451171875, 5.9871826171875, 6.19049072265625, 6.393798828125, 6.59710693359375, 6.8004150390625, 7.00372314453125, 7.20703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 15.0, 16.0, 22.0, 33.0, 52.0, 89.0, 124.0, 160.0, 136.0, 123.0, 83.0, 39.0, 29.0, 25.0, 17.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023257732391357422, -0.00022476725280284882, -0.0002169571816921234, -0.000209147110581398, -0.0002013370394706726, -0.0001935269683599472, -0.0001857168972492218, -0.0001779068261384964, -0.000170096755027771, -0.0001622866839170456, -0.0001544766128063202, -0.0001466665416955948, -0.00013885647058486938, -0.00013104639947414398, -0.00012323632836341858, -0.00011542625725269318, -0.00010761618614196777, -9.980611503124237e-05, -9.199604392051697e-05, -8.418597280979156e-05, -7.637590169906616e-05, -6.856583058834076e-05, -6.0755759477615356e-05, -5.2945688366889954e-05, -4.513561725616455e-05, -3.732554614543915e-05, -2.9515475034713745e-05, -2.1705403923988342e-05, -1.389533281326294e-05, -6.085261702537537e-06, 1.7248094081878662e-06, 9.534880518913269e-06, 1.7344951629638672e-05, 2.5155022740364075e-05, 3.296509385108948e-05, 4.077516496181488e-05, 4.858523607254028e-05, 5.6395307183265686e-05, 6.420537829399109e-05, 7.201544940471649e-05, 7.98255205154419e-05, 8.76355916261673e-05, 9.54456627368927e-05, 0.0001032557338476181, 0.0001110658049583435, 0.00011887587606906891, 0.0001266859471797943, 0.00013449601829051971, 0.00014230608940124512, 0.00015011616051197052, 0.00015792623162269592, 0.00016573630273342133, 0.00017354637384414673, 0.00018135644495487213, 0.00018916651606559753, 0.00019697658717632294, 0.00020478665828704834, 0.00021259672939777374, 0.00022040680050849915, 0.00022821687161922455, 0.00023602694272994995, 0.00024383701384067535, 0.00025164708495140076, 0.00025945715606212616, 0.00026726722717285156]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 9.0, 4.0, 2.0, 8.0, 15.0, 19.0, 18.0, 25.0, 53.0, 83.0, 125.0, 450.0, 5078.0, 823433.0, 216085.0, 2491.0, 356.0, 108.0, 69.0, 35.0, 29.0, 14.0, 15.0, 6.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.0234375, -5.860107421875, -5.69677734375, -5.533447265625, -5.3701171875, -5.206787109375, -5.04345703125, -4.880126953125, -4.716796875, -4.553466796875, -4.39013671875, -4.226806640625, -4.0634765625, -3.900146484375, -3.73681640625, -3.573486328125, -3.41015625, -3.246826171875, -3.08349609375, -2.920166015625, -2.7568359375, -2.593505859375, -2.43017578125, -2.266845703125, -2.103515625, -1.940185546875, -1.77685546875, -1.613525390625, -1.4501953125, -1.286865234375, -1.12353515625, -0.960205078125, -0.796875, -0.633544921875, -0.47021484375, -0.306884765625, -0.1435546875, 0.019775390625, 0.18310546875, 0.346435546875, 0.509765625, 0.673095703125, 0.83642578125, 0.999755859375, 1.1630859375, 1.326416015625, 1.48974609375, 1.653076171875, 1.81640625, 1.979736328125, 2.14306640625, 2.306396484375, 2.4697265625, 2.633056640625, 2.79638671875, 2.959716796875, 3.123046875, 3.286376953125, 3.44970703125, 3.613037109375, 3.7763671875, 3.939697265625, 4.10302734375, 4.266357421875, 4.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 5.0, 7.0, 10.0, 11.0, 15.0, 27.0, 29.0, 39.0, 62.0, 76.0, 90.0, 108.0, 96.0, 97.0, 85.0, 48.0, 44.0, 25.0, 21.0, 21.0, 12.0, 12.0, 9.0, 13.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5020980834960938, -0.4841766357421875, -0.46625518798828125, -0.448333740234375, -0.43041229248046875, -0.4124908447265625, -0.39456939697265625, -0.37664794921875, -0.35872650146484375, -0.3408050537109375, -0.32288360595703125, -0.304962158203125, -0.28704071044921875, -0.2691192626953125, -0.25119781494140625, -0.2332763671875, -0.21535491943359375, -0.1974334716796875, -0.17951202392578125, -0.161590576171875, -0.14366912841796875, -0.1257476806640625, -0.10782623291015625, -0.08990478515625, -0.07198333740234375, -0.0540618896484375, -0.03614044189453125, -0.018218994140625, -0.00029754638671875, 0.0176239013671875, 0.03554534912109375, 0.053466796875, 0.07138824462890625, 0.0893096923828125, 0.10723114013671875, 0.125152587890625, 0.14307403564453125, 0.1609954833984375, 0.17891693115234375, 0.19683837890625, 0.21475982666015625, 0.2326812744140625, 0.25060272216796875, 0.268524169921875, 0.28644561767578125, 0.3043670654296875, 0.32228851318359375, 0.3402099609375, 0.35813140869140625, 0.3760528564453125, 0.39397430419921875, 0.411895751953125, 0.42981719970703125, 0.4477386474609375, 0.46566009521484375, 0.48358154296875, 0.5015029907226562, 0.5194244384765625, 0.5373458862304688, 0.555267333984375, 0.5731887817382812, 0.5911102294921875, 0.6090316772460938, 0.626953125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 15.0, 168.0, 620.0, 193.0, 16.0, 0.0, 1.0, 1.0], "bins": [-85.31723022460938, -83.857666015625, -82.3980941772461, -80.93852996826172, -79.47895812988281, -78.01939392089844, -76.55982971191406, -75.10025787353516, -73.64069366455078, -72.1811294555664, -70.7215576171875, -69.26199340820312, -67.80242156982422, -66.34285736083984, -64.88328552246094, -63.42372131347656, -61.96415328979492, -60.50458526611328, -59.04501724243164, -57.58544921875, -56.125885009765625, -54.666316986083984, -53.206748962402344, -51.7471809387207, -50.28761291503906, -48.82804489135742, -47.36847686767578, -45.908912658691406, -44.449344635009766, -42.989776611328125, -41.530208587646484, -40.070640563964844, -38.61107635498047, -37.15150833129883, -35.69194030761719, -34.23237609863281, -32.77280807495117, -31.31324005126953, -29.85367202758789, -28.39410400390625, -26.93453598022461, -25.47496795654297, -24.01540184020996, -22.55583381652832, -21.096267700195312, -19.636699676513672, -18.17713165283203, -16.71756362915039, -15.2579984664917, -13.798431396484375, -12.338863372802734, -10.87929630279541, -9.419729232788086, -7.960162162780762, -6.500594139099121, -5.041027069091797, -3.5814599990844727, -2.1218926906585693, -0.662325382232666, 0.7972421646118164, 2.2568092346191406, 3.716376304626465, 5.1759443283081055, 6.63551139831543, 8.095078468322754]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 12.0, 17.0, 15.0, 25.0, 35.0, 33.0, 36.0, 50.0, 46.0, 42.0, 57.0, 55.0, 54.0, 60.0, 64.0, 45.0, 52.0, 52.0, 39.0, 36.0, 32.0, 34.0, 24.0, 29.0, 21.0, 13.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.296927452087402, -12.023918151855469, -11.750909805297852, -11.477900505065918, -11.2048921585083, -10.931882858276367, -10.65887451171875, -10.385865211486816, -10.112855911254883, -9.83984661102295, -9.566838264465332, -9.293828964233398, -9.020820617675781, -8.747811317443848, -8.474802017211914, -8.201793670654297, -7.9287848472595215, -7.655776023864746, -7.382767200469971, -7.109758377075195, -6.836749076843262, -6.563740253448486, -6.290731430053711, -6.0177226066589355, -5.74471378326416, -5.471704959869385, -5.198696136474609, -4.925686836242676, -4.6526780128479, -4.379669189453125, -4.10666036605835, -3.833651542663574, -3.5606422424316406, -3.2876334190368652, -3.0146243572235107, -2.7416155338287354, -2.468606472015381, -2.1955976486206055, -1.92258882522583, -1.6495798826217651, -1.3765709400177002, -1.1035619974136353, -0.8305531144142151, -0.5575442314147949, -0.28453528881073, -0.011526346206665039, 0.26148247718811035, 0.5344914197921753, 0.8075003623962402, 1.0805093050003052, 1.3535182476043701, 1.6265270709991455, 1.8995360136032104, 2.1725449562072754, 2.445553779602051, 2.718562602996826, 2.9915716648101807, 3.264580488204956, 3.5375895500183105, 3.810598373413086, 4.083607196807861, 4.356616020202637, 4.62962532043457, 4.902634143829346, 5.175642967224121]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 9.0, 11.0, 14.0, 15.0, 18.0, 31.0, 46.0, 52.0, 68.0, 109.0, 158.0, 224.0, 459.0, 1030.0, 3160.0, 14816.0, 116820.0, 1104153.0, 2380266.0, 508989.0, 51117.0, 8597.0, 2405.0, 840.0, 303.0, 178.0, 107.0, 78.0, 38.0, 47.0, 30.0, 18.0, 11.0, 9.0, 8.0, 13.0, 11.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.33203125, -4.17340087890625, -4.0147705078125, -3.85614013671875, -3.697509765625, -3.53887939453125, -3.3802490234375, -3.22161865234375, -3.06298828125, -2.90435791015625, -2.7457275390625, -2.58709716796875, -2.428466796875, -2.26983642578125, -2.1112060546875, -1.95257568359375, -1.7939453125, -1.63531494140625, -1.4766845703125, -1.31805419921875, -1.159423828125, -1.00079345703125, -0.8421630859375, -0.68353271484375, -0.52490234375, -0.36627197265625, -0.2076416015625, -0.04901123046875, 0.109619140625, 0.26824951171875, 0.4268798828125, 0.58551025390625, 0.744140625, 0.90277099609375, 1.0614013671875, 1.22003173828125, 1.378662109375, 1.53729248046875, 1.6959228515625, 1.85455322265625, 2.01318359375, 2.17181396484375, 2.3304443359375, 2.48907470703125, 2.647705078125, 2.80633544921875, 2.9649658203125, 3.12359619140625, 3.2822265625, 3.44085693359375, 3.5994873046875, 3.75811767578125, 3.916748046875, 4.07537841796875, 4.2340087890625, 4.39263916015625, 4.55126953125, 4.70989990234375, 4.8685302734375, 5.02716064453125, 5.185791015625, 5.34442138671875, 5.5030517578125, 5.66168212890625, 5.8203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 7.0, 11.0, 9.0, 26.0, 25.0, 36.0, 46.0, 47.0, 53.0, 55.0, 46.0, 53.0, 51.0, 89.0, 67.0, 62.0, 57.0, 54.0, 42.0, 32.0, 22.0, 36.0, 21.0, 19.0, 13.0, 7.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0], "bins": [-5.578125, -5.454620361328125, -5.33111572265625, -5.207611083984375, -5.0841064453125, -4.960601806640625, -4.83709716796875, -4.713592529296875, -4.590087890625, -4.466583251953125, -4.34307861328125, -4.219573974609375, -4.0960693359375, -3.972564697265625, -3.84906005859375, -3.725555419921875, -3.60205078125, -3.478546142578125, -3.35504150390625, -3.231536865234375, -3.1080322265625, -2.984527587890625, -2.86102294921875, -2.737518310546875, -2.614013671875, -2.490509033203125, -2.36700439453125, -2.243499755859375, -2.1199951171875, -1.996490478515625, -1.87298583984375, -1.749481201171875, -1.6259765625, -1.502471923828125, -1.37896728515625, -1.255462646484375, -1.1319580078125, -1.008453369140625, -0.88494873046875, -0.761444091796875, -0.637939453125, -0.514434814453125, -0.39093017578125, -0.267425537109375, -0.1439208984375, -0.020416259765625, 0.10308837890625, 0.226593017578125, 0.35009765625, 0.473602294921875, 0.59710693359375, 0.720611572265625, 0.8441162109375, 0.967620849609375, 1.09112548828125, 1.214630126953125, 1.338134765625, 1.461639404296875, 1.58514404296875, 1.708648681640625, 1.8321533203125, 1.955657958984375, 2.07916259765625, 2.202667236328125, 2.326171875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 14.0, 15.0, 26.0, 60.0, 127.0, 371.0, 1872.0, 334143.0, 3851824.0, 4903.0, 562.0, 194.0, 71.0, 32.0, 24.0, 10.0, 5.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.4794921875, -15.849609375, -15.2197265625, -14.58984375, -13.9599609375, -13.330078125, -12.7001953125, -12.0703125, -11.4404296875, -10.810546875, -10.1806640625, -9.55078125, -8.9208984375, -8.291015625, -7.6611328125, -7.03125, -6.4013671875, -5.771484375, -5.1416015625, -4.51171875, -3.8818359375, -3.251953125, -2.6220703125, -1.9921875, -1.3623046875, -0.732421875, -0.1025390625, 0.52734375, 1.1572265625, 1.787109375, 2.4169921875, 3.046875, 3.6767578125, 4.306640625, 4.9365234375, 5.56640625, 6.1962890625, 6.826171875, 7.4560546875, 8.0859375, 8.7158203125, 9.345703125, 9.9755859375, 10.60546875, 11.2353515625, 11.865234375, 12.4951171875, 13.125, 13.7548828125, 14.384765625, 15.0146484375, 15.64453125, 16.2744140625, 16.904296875, 17.5341796875, 18.1640625, 18.7939453125, 19.423828125, 20.0537109375, 20.68359375, 21.3134765625, 21.943359375, 22.5732421875, 23.203125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 4.0, 14.0, 14.0, 25.0, 32.0, 63.0, 85.0, 134.0, 216.0, 317.0, 529.0, 643.0, 676.0, 485.0, 303.0, 192.0, 109.0, 78.0, 48.0, 39.0, 19.0, 16.0, 13.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.87109375, -1.814117431640625, -1.75714111328125, -1.700164794921875, -1.6431884765625, -1.586212158203125, -1.52923583984375, -1.472259521484375, -1.415283203125, -1.358306884765625, -1.30133056640625, -1.244354248046875, -1.1873779296875, -1.130401611328125, -1.07342529296875, -1.016448974609375, -0.95947265625, -0.902496337890625, -0.84552001953125, -0.788543701171875, -0.7315673828125, -0.674591064453125, -0.61761474609375, -0.560638427734375, -0.503662109375, -0.446685791015625, -0.38970947265625, -0.332733154296875, -0.2757568359375, -0.218780517578125, -0.16180419921875, -0.104827880859375, -0.0478515625, 0.009124755859375, 0.06610107421875, 0.123077392578125, 0.1800537109375, 0.237030029296875, 0.29400634765625, 0.350982666015625, 0.407958984375, 0.464935302734375, 0.52191162109375, 0.578887939453125, 0.6358642578125, 0.692840576171875, 0.74981689453125, 0.806793212890625, 0.86376953125, 0.920745849609375, 0.97772216796875, 1.034698486328125, 1.0916748046875, 1.148651123046875, 1.20562744140625, 1.262603759765625, 1.319580078125, 1.376556396484375, 1.43353271484375, 1.490509033203125, 1.5474853515625, 1.604461669921875, 1.66143798828125, 1.718414306640625, 1.775390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 13.0, 36.0, 64.0, 100.0, 202.0, 204.0, 174.0, 108.0, 62.0, 31.0, 6.0, 3.0, 2.0], "bins": [-20.78423500061035, -20.415246963500977, -20.04625701904297, -19.677268981933594, -19.30828094482422, -18.939292907714844, -18.570302963256836, -18.20131492614746, -17.832326889038086, -17.46333885192871, -17.094348907470703, -16.725360870361328, -16.356372833251953, -15.987383842468262, -15.61839485168457, -15.249406814575195, -14.880417823791504, -14.511428833007812, -14.142440795898438, -13.773451805114746, -13.404463768005371, -13.03547477722168, -12.666486740112305, -12.297497749328613, -11.928508758544922, -11.55951976776123, -11.190531730651855, -10.821542739868164, -10.452554702758789, -10.083565711975098, -9.714576721191406, -9.345588684082031, -8.976601600646973, -8.607612609863281, -8.238624572753906, -7.869635581970215, -7.50064754486084, -7.131658554077148, -6.762670040130615, -6.393681526184082, -6.024693012237549, -5.655704498291016, -5.286715984344482, -4.917727470397949, -4.548738479614258, -4.179750442504883, -3.8107614517211914, -3.441772937774658, -3.072784423828125, -2.703795909881592, -2.3348073959350586, -1.9658186435699463, -1.596830129623413, -1.2278416156768799, -0.8588528633117676, -0.4898643493652344, -0.12087583541870117, 0.2481127381324768, 0.6171013116836548, 0.9860899448394775, 1.3550784587860107, 1.724066972732544, 2.0930557250976562, 2.4620442390441895, 2.8310327529907227]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 11.0, 22.0, 20.0, 26.0, 26.0, 39.0, 24.0, 38.0, 50.0, 43.0, 54.0, 62.0, 70.0, 49.0, 59.0, 58.0, 64.0, 48.0, 33.0, 28.0, 39.0, 16.0, 30.0, 22.0, 15.0, 12.0, 10.0, 4.0, 0.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.130297660827637, -3.998098850250244, -3.8659000396728516, -3.733701229095459, -3.6015024185180664, -3.469303607940674, -3.3371047973632812, -3.2049059867858887, -3.072707176208496, -2.9405083656311035, -2.808309555053711, -2.6761107444763184, -2.543911933898926, -2.411713123321533, -2.2795143127441406, -2.147315502166748, -2.0151166915893555, -1.882917881011963, -1.7507190704345703, -1.6185202598571777, -1.4863214492797852, -1.3541226387023926, -1.221923828125, -1.0897250175476074, -0.9575262069702148, -0.8253273963928223, -0.6931285858154297, -0.5609297752380371, -0.42873096466064453, -0.29653215408325195, -0.16433334350585938, -0.0321345329284668, 0.10006427764892578, 0.23226308822631836, 0.36446189880371094, 0.4966607093811035, 0.6288595199584961, 0.7610583305358887, 0.8932571411132812, 1.0254559516906738, 1.1576547622680664, 1.289853572845459, 1.4220523834228516, 1.5542511940002441, 1.6864500045776367, 1.8186488151550293, 1.9508476257324219, 2.0830464363098145, 2.215245246887207, 2.3474440574645996, 2.479642868041992, 2.6118416786193848, 2.7440404891967773, 2.87623929977417, 3.0084381103515625, 3.140636920928955, 3.2728357315063477, 3.4050345420837402, 3.537233352661133, 3.6694321632385254, 3.801630973815918, 3.9338297843933105, 4.066028594970703, 4.198227405548096, 4.330426216125488]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 12.0, 11.0, 21.0, 38.0, 50.0, 82.0, 131.0, 218.0, 440.0, 784.0, 1471.0, 3361.0, 9095.0, 42916.0, 325214.0, 551282.0, 89545.0, 15099.0, 4552.0, 1968.0, 985.0, 519.0, 298.0, 149.0, 107.0, 61.0, 48.0, 28.0, 18.0, 9.0, 5.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9404296875, -0.9030914306640625, -0.865753173828125, -0.8284149169921875, -0.79107666015625, -0.7537384033203125, -0.716400146484375, -0.6790618896484375, -0.6417236328125, -0.6043853759765625, -0.567047119140625, -0.5297088623046875, -0.49237060546875, -0.4550323486328125, -0.417694091796875, -0.3803558349609375, -0.343017578125, -0.3056793212890625, -0.268341064453125, -0.2310028076171875, -0.19366455078125, -0.1563262939453125, -0.118988037109375, -0.0816497802734375, -0.0443115234375, -0.0069732666015625, 0.030364990234375, 0.0677032470703125, 0.10504150390625, 0.1423797607421875, 0.179718017578125, 0.2170562744140625, 0.25439453125, 0.2917327880859375, 0.329071044921875, 0.3664093017578125, 0.40374755859375, 0.4410858154296875, 0.478424072265625, 0.5157623291015625, 0.5531005859375, 0.5904388427734375, 0.627777099609375, 0.6651153564453125, 0.70245361328125, 0.7397918701171875, 0.777130126953125, 0.8144683837890625, 0.851806640625, 0.8891448974609375, 0.926483154296875, 0.9638214111328125, 1.00115966796875, 1.0384979248046875, 1.075836181640625, 1.1131744384765625, 1.1505126953125, 1.1878509521484375, 1.225189208984375, 1.2625274658203125, 1.29986572265625, 1.3372039794921875, 1.374542236328125, 1.4118804931640625, 1.44921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 13.0, 14.0, 19.0, 24.0, 15.0, 34.0, 28.0, 31.0, 47.0, 48.0, 46.0, 63.0, 65.0, 66.0, 80.0, 56.0, 63.0, 55.0, 44.0, 36.0, 38.0, 20.0, 32.0, 24.0, 15.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.556640625, -3.466522216796875, -3.37640380859375, -3.286285400390625, -3.1961669921875, -3.106048583984375, -3.01593017578125, -2.925811767578125, -2.835693359375, -2.745574951171875, -2.65545654296875, -2.565338134765625, -2.4752197265625, -2.385101318359375, -2.29498291015625, -2.204864501953125, -2.11474609375, -2.024627685546875, -1.93450927734375, -1.844390869140625, -1.7542724609375, -1.664154052734375, -1.57403564453125, -1.483917236328125, -1.393798828125, -1.303680419921875, -1.21356201171875, -1.123443603515625, -1.0333251953125, -0.943206787109375, -0.85308837890625, -0.762969970703125, -0.6728515625, -0.582733154296875, -0.49261474609375, -0.402496337890625, -0.3123779296875, -0.222259521484375, -0.13214111328125, -0.042022705078125, 0.048095703125, 0.138214111328125, 0.22833251953125, 0.318450927734375, 0.4085693359375, 0.498687744140625, 0.58880615234375, 0.678924560546875, 0.76904296875, 0.859161376953125, 0.94927978515625, 1.039398193359375, 1.1295166015625, 1.219635009765625, 1.30975341796875, 1.399871826171875, 1.489990234375, 1.580108642578125, 1.67022705078125, 1.760345458984375, 1.8504638671875, 1.940582275390625, 2.03070068359375, 2.120819091796875, 2.2109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 11.0, 11.0, 27.0, 17.0, 46.0, 56.0, 81.0, 120.0, 162.0, 238.0, 356.0, 569.0, 826.0, 1421.0, 2224.0, 3783.0, 6582.0, 11952.0, 21316.0, 39950.0, 73557.0, 128638.0, 192301.0, 206584.0, 153791.0, 91582.0, 49808.0, 27328.0, 14734.0, 8248.0, 4775.0, 2735.0, 1671.0, 1017.0, 630.0, 467.0, 296.0, 197.0, 125.0, 83.0, 64.0, 47.0, 38.0, 21.0, 22.0, 11.0, 10.0, 10.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2496337890625, -0.24162864685058594, -0.23362350463867188, -0.2256183624267578, -0.21761322021484375, -0.2096080780029297, -0.20160293579101562, -0.19359779357910156, -0.1855926513671875, -0.17758750915527344, -0.16958236694335938, -0.1615772247314453, -0.15357208251953125, -0.1455669403076172, -0.13756179809570312, -0.12955665588378906, -0.121551513671875, -0.11354637145996094, -0.10554122924804688, -0.09753608703613281, -0.08953094482421875, -0.08152580261230469, -0.07352066040039062, -0.06551551818847656, -0.0575103759765625, -0.04950523376464844, -0.041500091552734375, -0.03349494934082031, -0.02548980712890625, -0.017484664916992188, -0.009479522705078125, -0.0014743804931640625, 0.00653076171875, 0.014535903930664062, 0.022541046142578125, 0.030546188354492188, 0.03855133056640625, 0.04655647277832031, 0.054561614990234375, 0.06256675720214844, 0.0705718994140625, 0.07857704162597656, 0.08658218383789062, 0.09458732604980469, 0.10259246826171875, 0.11059761047363281, 0.11860275268554688, 0.12660789489746094, 0.134613037109375, 0.14261817932128906, 0.15062332153320312, 0.1586284637451172, 0.16663360595703125, 0.1746387481689453, 0.18264389038085938, 0.19064903259277344, 0.1986541748046875, 0.20665931701660156, 0.21466445922851562, 0.2226696014404297, 0.23067474365234375, 0.2386798858642578, 0.24668502807617188, 0.25469017028808594, 0.2626953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 7.0, 11.0, 7.0, 12.0, 18.0, 18.0, 14.0, 13.0, 25.0, 30.0, 41.0, 51.0, 48.0, 60.0, 48.0, 50.0, 60.0, 59.0, 52.0, 57.0, 37.0, 44.0, 41.0, 36.0, 25.0, 23.0, 33.0, 18.0, 15.0, 8.0, 6.0, 9.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.6015625, -4.460205078125, -4.31884765625, -4.177490234375, -4.0361328125, -3.894775390625, -3.75341796875, -3.612060546875, -3.470703125, -3.329345703125, -3.18798828125, -3.046630859375, -2.9052734375, -2.763916015625, -2.62255859375, -2.481201171875, -2.33984375, -2.198486328125, -2.05712890625, -1.915771484375, -1.7744140625, -1.633056640625, -1.49169921875, -1.350341796875, -1.208984375, -1.067626953125, -0.92626953125, -0.784912109375, -0.6435546875, -0.502197265625, -0.36083984375, -0.219482421875, -0.078125, 0.063232421875, 0.20458984375, 0.345947265625, 0.4873046875, 0.628662109375, 0.77001953125, 0.911376953125, 1.052734375, 1.194091796875, 1.33544921875, 1.476806640625, 1.6181640625, 1.759521484375, 1.90087890625, 2.042236328125, 2.18359375, 2.324951171875, 2.46630859375, 2.607666015625, 2.7490234375, 2.890380859375, 3.03173828125, 3.173095703125, 3.314453125, 3.455810546875, 3.59716796875, 3.738525390625, 3.8798828125, 4.021240234375, 4.16259765625, 4.303955078125, 4.4453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 13.0, 17.0, 20.0, 36.0, 49.0, 71.0, 112.0, 167.0, 258.0, 412.0, 727.0, 1465.0, 3459.0, 9148.0, 31091.0, 131849.0, 444928.0, 319329.0, 75059.0, 19021.0, 6267.0, 2423.0, 1052.0, 583.0, 344.0, 183.0, 118.0, 100.0, 63.0, 46.0, 30.0, 23.0, 14.0, 16.0, 13.0, 12.0, 6.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0673828125, -0.06519603729248047, -0.06300926208496094, -0.060822486877441406, -0.058635711669921875, -0.056448936462402344, -0.05426216125488281, -0.05207538604736328, -0.04988861083984375, -0.04770183563232422, -0.04551506042480469, -0.043328285217285156, -0.041141510009765625, -0.038954734802246094, -0.03676795959472656, -0.03458118438720703, -0.0323944091796875, -0.03020763397216797, -0.028020858764648438, -0.025834083557128906, -0.023647308349609375, -0.021460533142089844, -0.019273757934570312, -0.01708698272705078, -0.01490020751953125, -0.012713432312011719, -0.010526657104492188, -0.008339881896972656, -0.006153106689453125, -0.003966331481933594, -0.0017795562744140625, 0.00040721893310546875, 0.002593994140625, 0.004780769348144531, 0.0069675445556640625, 0.009154319763183594, 0.011341094970703125, 0.013527870178222656, 0.015714645385742188, 0.01790142059326172, 0.02008819580078125, 0.02227497100830078, 0.024461746215820312, 0.026648521423339844, 0.028835296630859375, 0.031022071838378906, 0.03320884704589844, 0.03539562225341797, 0.0375823974609375, 0.03976917266845703, 0.04195594787597656, 0.044142723083496094, 0.046329498291015625, 0.048516273498535156, 0.05070304870605469, 0.05288982391357422, 0.05507659912109375, 0.05726337432861328, 0.05945014953613281, 0.061636924743652344, 0.06382369995117188, 0.0660104751586914, 0.06819725036621094, 0.07038402557373047, 0.07257080078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 10.0, 15.0, 7.0, 15.0, 16.0, 36.0, 36.0, 42.0, 49.0, 50.0, 75.0, 72.0, 68.0, 65.0, 81.0, 70.0, 63.0, 41.0, 39.0, 32.0, 22.0, 20.0, 14.0, 12.0, 6.0, 8.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.349781036376953e-05, -3.233086317777634e-05, -3.116391599178314e-05, -2.9996968805789948e-05, -2.8830021619796753e-05, -2.766307443380356e-05, -2.6496127247810364e-05, -2.532918006181717e-05, -2.4162232875823975e-05, -2.299528568983078e-05, -2.1828338503837585e-05, -2.066139131784439e-05, -1.9494444131851196e-05, -1.8327496945858002e-05, -1.7160549759864807e-05, -1.5993602573871613e-05, -1.4826655387878418e-05, -1.3659708201885223e-05, -1.2492761015892029e-05, -1.1325813829898834e-05, -1.015886664390564e-05, -8.991919457912445e-06, -7.82497227191925e-06, -6.658025085926056e-06, -5.491077899932861e-06, -4.324130713939667e-06, -3.157183527946472e-06, -1.9902363419532776e-06, -8.23289155960083e-07, 3.4365803003311157e-07, 1.5106052160263062e-06, 2.6775524020195007e-06, 3.844499588012695e-06, 5.01144677400589e-06, 6.1783939599990845e-06, 7.345341145992279e-06, 8.512288331985474e-06, 9.679235517978668e-06, 1.0846182703971863e-05, 1.2013129889965057e-05, 1.3180077075958252e-05, 1.4347024261951447e-05, 1.551397144794464e-05, 1.6680918633937836e-05, 1.784786581993103e-05, 1.9014813005924225e-05, 2.018176019191742e-05, 2.1348707377910614e-05, 2.251565456390381e-05, 2.3682601749897003e-05, 2.4849548935890198e-05, 2.6016496121883392e-05, 2.7183443307876587e-05, 2.835039049386978e-05, 2.9517337679862976e-05, 3.068428486585617e-05, 3.1851232051849365e-05, 3.301817923784256e-05, 3.4185126423835754e-05, 3.535207360982895e-05, 3.6519020795822144e-05, 3.768596798181534e-05, 3.885291516780853e-05, 4.001986235380173e-05, 4.118680953979492e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 2.0, 11.0, 14.0, 15.0, 23.0, 26.0, 33.0, 50.0, 97.0, 178.0, 362.0, 800.0, 2223.0, 7223.0, 29406.0, 206644.0, 641897.0, 129950.0, 20968.0, 5475.0, 1762.0, 685.0, 307.0, 136.0, 74.0, 55.0, 35.0, 23.0, 20.0, 11.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.10406494140625, -0.10074996948242188, -0.09743499755859375, -0.09412002563476562, -0.0908050537109375, -0.08749008178710938, -0.08417510986328125, -0.08086013793945312, -0.077545166015625, -0.07423019409179688, -0.07091522216796875, -0.06760025024414062, -0.0642852783203125, -0.060970306396484375, -0.05765533447265625, -0.054340362548828125, -0.051025390625, -0.047710418701171875, -0.04439544677734375, -0.041080474853515625, -0.0377655029296875, -0.034450531005859375, -0.03113555908203125, -0.027820587158203125, -0.024505615234375, -0.021190643310546875, -0.01787567138671875, -0.014560699462890625, -0.0112457275390625, -0.007930755615234375, -0.00461578369140625, -0.001300811767578125, 0.00201416015625, 0.005329132080078125, 0.00864410400390625, 0.011959075927734375, 0.0152740478515625, 0.018589019775390625, 0.02190399169921875, 0.025218963623046875, 0.028533935546875, 0.031848907470703125, 0.03516387939453125, 0.038478851318359375, 0.0417938232421875, 0.045108795166015625, 0.04842376708984375, 0.051738739013671875, 0.0550537109375, 0.058368682861328125, 0.06168365478515625, 0.06499862670898438, 0.0683135986328125, 0.07162857055664062, 0.07494354248046875, 0.07825851440429688, 0.081573486328125, 0.08488845825195312, 0.08820343017578125, 0.09151840209960938, 0.0948333740234375, 0.09814834594726562, 0.10146331787109375, 0.10477828979492188, 0.10809326171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 8.0, 17.0, 13.0, 16.0, 26.0, 30.0, 43.0, 58.0, 79.0, 123.0, 103.0, 107.0, 102.0, 55.0, 42.0, 38.0, 24.0, 11.0, 14.0, 11.0, 5.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0247039794921875, -0.023903608322143555, -0.02310323715209961, -0.022302865982055664, -0.02150249481201172, -0.020702123641967773, -0.019901752471923828, -0.019101381301879883, -0.018301010131835938, -0.017500638961791992, -0.016700267791748047, -0.0158998966217041, -0.015099525451660156, -0.014299154281616211, -0.013498783111572266, -0.01269841194152832, -0.011898040771484375, -0.01109766960144043, -0.010297298431396484, -0.009496927261352539, -0.008696556091308594, -0.007896184921264648, -0.007095813751220703, -0.006295442581176758, -0.0054950714111328125, -0.004694700241088867, -0.003894329071044922, -0.0030939579010009766, -0.0022935867309570312, -0.001493215560913086, -0.0006928443908691406, 0.00010752677917480469, 0.00090789794921875, 0.0017082691192626953, 0.0025086402893066406, 0.003309011459350586, 0.004109382629394531, 0.0049097537994384766, 0.005710124969482422, 0.006510496139526367, 0.0073108673095703125, 0.008111238479614258, 0.008911609649658203, 0.009711980819702148, 0.010512351989746094, 0.011312723159790039, 0.012113094329833984, 0.01291346549987793, 0.013713836669921875, 0.01451420783996582, 0.015314579010009766, 0.01611495018005371, 0.016915321350097656, 0.0177156925201416, 0.018516063690185547, 0.019316434860229492, 0.020116806030273438, 0.020917177200317383, 0.021717548370361328, 0.022517919540405273, 0.02331829071044922, 0.024118661880493164, 0.02491903305053711, 0.025719404220581055, 0.026519775390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 16.0, 42.0, 75.0, 167.0, 244.0, 219.0, 135.0, 70.0, 22.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.225727081298828, -10.974468231201172, -10.7232084274292, -10.471949577331543, -10.220690727233887, -9.969430923461914, -9.718172073364258, -9.466913223266602, -9.215653419494629, -8.964394569396973, -8.713134765625, -8.461875915527344, -8.210617065429688, -7.959357261657715, -7.708098411560059, -7.456839084625244, -7.205580234527588, -6.954320907592773, -6.703062057495117, -6.451802730560303, -6.200543403625488, -5.949284553527832, -5.698025226593018, -5.446765899658203, -5.195507049560547, -4.944247722625732, -4.692988872528076, -4.441729545593262, -4.190470218658447, -3.939211130142212, -3.6879520416259766, -3.436692714691162, -3.1854333877563477, -2.9341742992401123, -2.682914972305298, -2.4316558837890625, -2.180396556854248, -1.9291374683380127, -1.6778783798217773, -1.4266191720962524, -1.1753599643707275, -0.9241007566452026, -0.6728416085243225, -0.4215824604034424, -0.17032325267791748, 0.08093595504760742, 0.3321950435638428, 0.5834542512893677, 0.8347134590148926, 1.0859726667404175, 1.3372318744659424, 1.5884909629821777, 1.8397501707077026, 2.0910093784332275, 2.342268466949463, 2.5935277938842773, 2.8447868824005127, 3.096045970916748, 3.3473052978515625, 3.598564386367798, 3.849823474884033, 4.101082801818848, 4.352341651916504, 4.603600978851318, 4.854860305786133]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 17.0, 30.0, 33.0, 36.0, 46.0, 45.0, 66.0, 65.0, 96.0, 85.0, 71.0, 94.0, 80.0, 44.0, 42.0, 43.0, 34.0, 27.0, 14.0, 12.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.771545886993408, -3.659273624420166, -3.547001361846924, -3.4347290992736816, -3.3224568367004395, -3.2101845741271973, -3.097912311553955, -2.985640048980713, -2.8733677864074707, -2.7610955238342285, -2.6488232612609863, -2.536550998687744, -2.424278736114502, -2.3120064735412598, -2.1997342109680176, -2.0874619483947754, -1.9751899242401123, -1.8629176616668701, -1.750645399093628, -1.6383731365203857, -1.5261008739471436, -1.4138286113739014, -1.3015564680099487, -1.1892842054367065, -1.0770119428634644, -0.9647396802902222, -0.85246741771698, -0.7401952147483826, -0.6279229521751404, -0.5156506896018982, -0.4033784866333008, -0.2911062240600586, -0.1788339614868164, -0.06656171381473541, 0.04571053385734558, 0.15798276662826538, 0.27025502920150757, 0.38252729177474976, 0.49479949474334717, 0.6070717573165894, 0.7193440198898315, 0.8316162824630737, 0.9438885450363159, 1.0561606884002686, 1.1684329509735107, 1.280705213546753, 1.3929774761199951, 1.5052497386932373, 1.6175220012664795, 1.7297942638397217, 1.8420665264129639, 1.954338788986206, 2.0666110515594482, 2.1788833141326904, 2.2911553382873535, 2.4034276008605957, 2.515699863433838, 2.62797212600708, 2.7402443885803223, 2.8525166511535645, 2.9647889137268066, 3.077061176300049, 3.189333438873291, 3.301605701446533, 3.4138779640197754]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 10.0, 19.0, 34.0, 46.0, 91.0, 163.0, 370.0, 752.0, 2299.0, 6714.0, 23156.0, 89616.0, 402289.0, 400073.0, 89881.0, 22710.0, 6522.0, 2100.0, 883.0, 384.0, 176.0, 101.0, 68.0, 28.0, 19.0, 15.0, 12.0, 2.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.812225341796875, -2.73187255859375, -2.651519775390625, -2.5711669921875, -2.490814208984375, -2.41046142578125, -2.330108642578125, -2.249755859375, -2.169403076171875, -2.08905029296875, -2.008697509765625, -1.9283447265625, -1.847991943359375, -1.76763916015625, -1.687286376953125, -1.60693359375, -1.526580810546875, -1.44622802734375, -1.365875244140625, -1.2855224609375, -1.205169677734375, -1.12481689453125, -1.044464111328125, -0.964111328125, -0.883758544921875, -0.80340576171875, -0.723052978515625, -0.6427001953125, -0.562347412109375, -0.48199462890625, -0.401641845703125, -0.3212890625, -0.240936279296875, -0.16058349609375, -0.080230712890625, 0.0001220703125, 0.080474853515625, 0.16082763671875, 0.241180419921875, 0.321533203125, 0.401885986328125, 0.48223876953125, 0.562591552734375, 0.6429443359375, 0.723297119140625, 0.80364990234375, 0.884002685546875, 0.96435546875, 1.044708251953125, 1.12506103515625, 1.205413818359375, 1.2857666015625, 1.366119384765625, 1.44647216796875, 1.526824951171875, 1.607177734375, 1.687530517578125, 1.76788330078125, 1.848236083984375, 1.9285888671875, 2.008941650390625, 2.08929443359375, 2.169647216796875, 2.25]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 7.0, 5.0, 8.0, 15.0, 11.0, 26.0, 29.0, 22.0, 33.0, 45.0, 42.0, 37.0, 61.0, 53.0, 62.0, 58.0, 68.0, 56.0, 61.0, 52.0, 42.0, 43.0, 36.0, 24.0, 25.0, 23.0, 20.0, 13.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.04296875, -5.8858642578125, -5.728759765625, -5.5716552734375, -5.41455078125, -5.2574462890625, -5.100341796875, -4.9432373046875, -4.7861328125, -4.6290283203125, -4.471923828125, -4.3148193359375, -4.15771484375, -4.0006103515625, -3.843505859375, -3.6864013671875, -3.529296875, -3.3721923828125, -3.215087890625, -3.0579833984375, -2.90087890625, -2.7437744140625, -2.586669921875, -2.4295654296875, -2.2724609375, -2.1153564453125, -1.958251953125, -1.8011474609375, -1.64404296875, -1.4869384765625, -1.329833984375, -1.1727294921875, -1.015625, -0.8585205078125, -0.701416015625, -0.5443115234375, -0.38720703125, -0.2301025390625, -0.072998046875, 0.0841064453125, 0.2412109375, 0.3983154296875, 0.555419921875, 0.7125244140625, 0.86962890625, 1.0267333984375, 1.183837890625, 1.3409423828125, 1.498046875, 1.6551513671875, 1.812255859375, 1.9693603515625, 2.12646484375, 2.2835693359375, 2.440673828125, 2.5977783203125, 2.7548828125, 2.9119873046875, 3.069091796875, 3.2261962890625, 3.38330078125, 3.5404052734375, 3.697509765625, 3.8546142578125, 4.01171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 7.0, 16.0, 6.0, 30.0, 18.0, 20.0, 23.0, 22.0, 41.0, 23.0, 39.0, 58.0, 83.0, 197.0, 1032.0, 291205.0, 753598.0, 1439.0, 233.0, 86.0, 48.0, 44.0, 38.0, 38.0, 25.0, 32.0, 16.0, 20.0, 15.0, 10.0, 11.0, 15.0, 6.0, 11.0, 1.0, 5.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.166015625, -15.69140625, -15.216796875, -14.7421875, -14.267578125, -13.79296875, -13.318359375, -12.84375, -12.369140625, -11.89453125, -11.419921875, -10.9453125, -10.470703125, -9.99609375, -9.521484375, -9.046875, -8.572265625, -8.09765625, -7.623046875, -7.1484375, -6.673828125, -6.19921875, -5.724609375, -5.25, -4.775390625, -4.30078125, -3.826171875, -3.3515625, -2.876953125, -2.40234375, -1.927734375, -1.453125, -0.978515625, -0.50390625, -0.029296875, 0.4453125, 0.919921875, 1.39453125, 1.869140625, 2.34375, 2.818359375, 3.29296875, 3.767578125, 4.2421875, 4.716796875, 5.19140625, 5.666015625, 6.140625, 6.615234375, 7.08984375, 7.564453125, 8.0390625, 8.513671875, 8.98828125, 9.462890625, 9.9375, 10.412109375, 10.88671875, 11.361328125, 11.8359375, 12.310546875, 12.78515625, 13.259765625, 13.734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 7.0, 10.0, 2.0, 3.0, 14.0, 13.0, 10.0, 26.0, 15.0, 33.0, 15.0, 37.0, 31.0, 36.0, 35.0, 41.0, 40.0, 46.0, 56.0, 37.0, 53.0, 57.0, 44.0, 46.0, 39.0, 29.0, 38.0, 35.0, 23.0, 30.0, 11.0, 25.0, 14.0, 10.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.734375, -4.601226806640625, -4.46807861328125, -4.334930419921875, -4.2017822265625, -4.068634033203125, -3.93548583984375, -3.802337646484375, -3.669189453125, -3.536041259765625, -3.40289306640625, -3.269744873046875, -3.1365966796875, -3.003448486328125, -2.87030029296875, -2.737152099609375, -2.60400390625, -2.470855712890625, -2.33770751953125, -2.204559326171875, -2.0714111328125, -1.938262939453125, -1.80511474609375, -1.671966552734375, -1.538818359375, -1.405670166015625, -1.27252197265625, -1.139373779296875, -1.0062255859375, -0.873077392578125, -0.73992919921875, -0.606781005859375, -0.4736328125, -0.340484619140625, -0.20733642578125, -0.074188232421875, 0.0589599609375, 0.192108154296875, 0.32525634765625, 0.458404541015625, 0.591552734375, 0.724700927734375, 0.85784912109375, 0.990997314453125, 1.1241455078125, 1.257293701171875, 1.39044189453125, 1.523590087890625, 1.65673828125, 1.789886474609375, 1.92303466796875, 2.056182861328125, 2.1893310546875, 2.322479248046875, 2.45562744140625, 2.588775634765625, 2.721923828125, 2.855072021484375, 2.98822021484375, 3.121368408203125, 3.2545166015625, 3.387664794921875, 3.52081298828125, 3.653961181640625, 3.787109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 15.0, 23.0, 21.0, 43.0, 72.0, 135.0, 345.0, 1568.0, 11131.0, 511364.0, 510368.0, 11083.0, 1574.0, 433.0, 151.0, 71.0, 51.0, 31.0, 13.0, 12.0, 9.0, 6.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.6953125, -2.622467041015625, -2.54962158203125, -2.476776123046875, -2.4039306640625, -2.331085205078125, -2.25823974609375, -2.185394287109375, -2.112548828125, -2.039703369140625, -1.96685791015625, -1.894012451171875, -1.8211669921875, -1.748321533203125, -1.67547607421875, -1.602630615234375, -1.52978515625, -1.456939697265625, -1.38409423828125, -1.311248779296875, -1.2384033203125, -1.165557861328125, -1.09271240234375, -1.019866943359375, -0.947021484375, -0.874176025390625, -0.80133056640625, -0.728485107421875, -0.6556396484375, -0.582794189453125, -0.50994873046875, -0.437103271484375, -0.3642578125, -0.291412353515625, -0.21856689453125, -0.145721435546875, -0.0728759765625, -3.0517578125e-05, 0.07281494140625, 0.145660400390625, 0.218505859375, 0.291351318359375, 0.36419677734375, 0.437042236328125, 0.5098876953125, 0.582733154296875, 0.65557861328125, 0.728424072265625, 0.80126953125, 0.874114990234375, 0.94696044921875, 1.019805908203125, 1.0926513671875, 1.165496826171875, 1.23834228515625, 1.311187744140625, 1.384033203125, 1.456878662109375, 1.52972412109375, 1.602569580078125, 1.6754150390625, 1.748260498046875, 1.82110595703125, 1.893951416015625, 1.966796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 7.0, 18.0, 19.0, 26.0, 47.0, 62.0, 72.0, 117.0, 119.0, 120.0, 87.0, 80.0, 54.0, 50.0, 30.0, 20.0, 23.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016820430755615234, -0.00016312859952449799, -0.00015805289149284363, -0.00015297718346118927, -0.0001479014754295349, -0.00014282576739788055, -0.0001377500593662262, -0.00013267435133457184, -0.00012759864330291748, -0.00012252293527126312, -0.00011744722723960876, -0.0001123715192079544, -0.00010729581117630005, -0.00010222010314464569, -9.714439511299133e-05, -9.206868708133698e-05, -8.699297904968262e-05, -8.191727101802826e-05, -7.68415629863739e-05, -7.176585495471954e-05, -6.669014692306519e-05, -6.161443889141083e-05, -5.653873085975647e-05, -5.146302282810211e-05, -4.6387314796447754e-05, -4.1311606764793396e-05, -3.623589873313904e-05, -3.116019070148468e-05, -2.6084482669830322e-05, -2.1008774638175964e-05, -1.5933066606521606e-05, -1.0857358574867249e-05, -5.781650543212891e-06, -7.059425115585327e-07, 4.369765520095825e-06, 9.445473551750183e-06, 1.4521181583404541e-05, 1.95968896150589e-05, 2.4672597646713257e-05, 2.9748305678367615e-05, 3.482401371002197e-05, 3.989972174167633e-05, 4.497542977333069e-05, 5.0051137804985046e-05, 5.5126845836639404e-05, 6.020255386829376e-05, 6.527826189994812e-05, 7.035396993160248e-05, 7.542967796325684e-05, 8.05053859949112e-05, 8.558109402656555e-05, 9.065680205821991e-05, 9.573251008987427e-05, 0.00010080821812152863, 0.00010588392615318298, 0.00011095963418483734, 0.0001160353422164917, 0.00012111105024814606, 0.00012618675827980042, 0.00013126246631145477, 0.00013633817434310913, 0.0001414138823747635, 0.00014648959040641785, 0.0001515652984380722, 0.00015664100646972656]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 11.0, 16.0, 20.0, 20.0, 33.0, 76.0, 113.0, 215.0, 424.0, 924.0, 2526.0, 9247.0, 59905.0, 533726.0, 389010.0, 40970.0, 7393.0, 2179.0, 833.0, 386.0, 204.0, 124.0, 55.0, 32.0, 21.0, 13.0, 12.0, 9.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.2900390625, -1.2519989013671875, -1.213958740234375, -1.1759185791015625, -1.13787841796875, -1.0998382568359375, -1.061798095703125, -1.0237579345703125, -0.9857177734375, -0.9476776123046875, -0.909637451171875, -0.8715972900390625, -0.83355712890625, -0.7955169677734375, -0.757476806640625, -0.7194366455078125, -0.681396484375, -0.6433563232421875, -0.605316162109375, -0.5672760009765625, -0.52923583984375, -0.4911956787109375, -0.453155517578125, -0.4151153564453125, -0.3770751953125, -0.3390350341796875, -0.300994873046875, -0.2629547119140625, -0.22491455078125, -0.1868743896484375, -0.148834228515625, -0.1107940673828125, -0.07275390625, -0.0347137451171875, 0.003326416015625, 0.0413665771484375, 0.07940673828125, 0.1174468994140625, 0.155487060546875, 0.1935272216796875, 0.2315673828125, 0.2696075439453125, 0.307647705078125, 0.3456878662109375, 0.38372802734375, 0.4217681884765625, 0.459808349609375, 0.4978485107421875, 0.535888671875, 0.5739288330078125, 0.611968994140625, 0.6500091552734375, 0.68804931640625, 0.7260894775390625, 0.764129638671875, 0.8021697998046875, 0.8402099609375, 0.8782501220703125, 0.916290283203125, 0.9543304443359375, 0.99237060546875, 1.0304107666015625, 1.068450927734375, 1.1064910888671875, 1.14453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 9.0, 13.0, 15.0, 20.0, 27.0, 35.0, 58.0, 81.0, 120.0, 118.0, 120.0, 113.0, 70.0, 51.0, 44.0, 27.0, 23.0, 7.0, 14.0, 4.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3740882873535156, -0.35779571533203125, -0.3415031433105469, -0.3252105712890625, -0.3089179992675781, -0.29262542724609375, -0.2763328552246094, -0.260040283203125, -0.24374771118164062, -0.22745513916015625, -0.21116256713867188, -0.1948699951171875, -0.17857742309570312, -0.16228485107421875, -0.14599227905273438, -0.12969970703125, -0.11340713500976562, -0.09711456298828125, -0.08082199096679688, -0.0645294189453125, -0.048236846923828125, -0.03194427490234375, -0.015651702880859375, 0.000640869140625, 0.016933441162109375, 0.03322601318359375, 0.049518585205078125, 0.0658111572265625, 0.08210372924804688, 0.09839630126953125, 0.11468887329101562, 0.1309814453125, 0.14727401733398438, 0.16356658935546875, 0.17985916137695312, 0.1961517333984375, 0.21244430541992188, 0.22873687744140625, 0.24502944946289062, 0.261322021484375, 0.2776145935058594, 0.29390716552734375, 0.3101997375488281, 0.3264923095703125, 0.3427848815917969, 0.35907745361328125, 0.3753700256347656, 0.39166259765625, 0.4079551696777344, 0.42424774169921875, 0.4405403137207031, 0.4568328857421875, 0.4731254577636719, 0.48941802978515625, 0.5057106018066406, 0.522003173828125, 0.5382957458496094, 0.5545883178710938, 0.5708808898925781, 0.5871734619140625, 0.6034660339355469, 0.6197586059570312, 0.6360511779785156, 0.65234375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 15.0, 32.0, 111.0, 174.0, 230.0, 205.0, 130.0, 59.0, 23.0, 10.0, 4.0, 3.0, 0.0, 1.0], "bins": [-25.567317962646484, -25.098392486572266, -24.629467010498047, -24.160541534423828, -23.69161605834961, -23.22269058227539, -22.753765106201172, -22.284839630126953, -21.815914154052734, -21.346988677978516, -20.878063201904297, -20.409137725830078, -19.94021224975586, -19.47128677368164, -19.002361297607422, -18.533435821533203, -18.064510345458984, -17.595584869384766, -17.126659393310547, -16.657733917236328, -16.18880844116211, -15.71988296508789, -15.250957489013672, -14.782032012939453, -14.31310749053955, -13.844182014465332, -13.375256538391113, -12.906331062316895, -12.437405586242676, -11.968480110168457, -11.499554634094238, -11.03062915802002, -10.561702728271484, -10.092777252197266, -9.623851776123047, -9.154926300048828, -8.68600082397461, -8.21707534790039, -7.748149871826172, -7.279224395751953, -6.810299873352051, -6.341374397277832, -5.872448921203613, -5.4035234451293945, -4.934597969055176, -4.465672492980957, -3.9967472553253174, -3.5278217792510986, -3.058896064758301, -2.589970588684082, -2.1210451126098633, -1.652119755744934, -1.1831942796707153, -0.7142689228057861, -0.24534344673156738, 0.22358202934265137, 0.6925075054168701, 1.1614329814910889, 1.6303584575653076, 2.0992836952209473, 2.568209171295166, 3.0371346473693848, 3.5060601234436035, 3.9749855995178223, 4.443911075592041]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 9.0, 12.0, 8.0, 14.0, 12.0, 18.0, 14.0, 18.0, 24.0, 28.0, 36.0, 28.0, 41.0, 37.0, 40.0, 42.0, 44.0, 39.0, 38.0, 48.0, 45.0, 37.0, 55.0, 36.0, 28.0, 36.0, 20.0, 31.0, 29.0, 26.0, 19.0, 15.0, 12.0, 11.0, 8.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-6.464783668518066, -6.28306770324707, -6.101352214813232, -5.919636249542236, -5.73792028427124, -5.556204795837402, -5.374488830566406, -5.19277286529541, -5.011057376861572, -4.829341411590576, -4.647625923156738, -4.465909957885742, -4.284193992614746, -4.102478504180908, -3.920762538909912, -3.739046812057495, -3.557330846786499, -3.375615119934082, -3.193899154663086, -3.012183427810669, -2.830467700958252, -2.648751735687256, -2.467036008834839, -2.285320281982422, -2.103604316711426, -1.9218884706497192, -1.7401727437973022, -1.5584568977355957, -1.3767411708831787, -1.1950253248214722, -1.0133094787597656, -0.8315937519073486, -0.6498780250549316, -0.4681622385978699, -0.2864464223384857, -0.10473060607910156, 0.0769851803779602, 0.258700966835022, 0.4404168128967285, 0.6221325397491455, 0.803848385810852, 0.9855641722679138, 1.1672799587249756, 1.3489958047866821, 1.5307116508483887, 1.7124273777008057, 1.8941432237625122, 2.0758590698242188, 2.2575747966766357, 2.4392905235290527, 2.621006488800049, 2.802722215652466, 2.984437942504883, 3.166153907775879, 3.347869634628296, 3.529585361480713, 3.711301326751709, 3.893017053604126, 4.074732780456543, 4.256448745727539, 4.438164710998535, 4.619880199432373, 4.801596164703369, 4.983311653137207, 5.165027618408203]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 7.0, 4.0, 8.0, 9.0, 11.0, 17.0, 18.0, 24.0, 30.0, 38.0, 72.0, 88.0, 146.0, 210.0, 356.0, 590.0, 1460.0, 3671.0, 12685.0, 58948.0, 346837.0, 1573494.0, 1685918.0, 413126.0, 72496.0, 16197.0, 4838.0, 1577.0, 658.0, 332.0, 141.0, 100.0, 60.0, 27.0, 25.0, 11.0, 14.0, 11.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.8046875, -3.68597412109375, -3.5672607421875, -3.44854736328125, -3.329833984375, -3.21112060546875, -3.0924072265625, -2.97369384765625, -2.85498046875, -2.73626708984375, -2.6175537109375, -2.49884033203125, -2.380126953125, -2.26141357421875, -2.1427001953125, -2.02398681640625, -1.9052734375, -1.78656005859375, -1.6678466796875, -1.54913330078125, -1.430419921875, -1.31170654296875, -1.1929931640625, -1.07427978515625, -0.95556640625, -0.83685302734375, -0.7181396484375, -0.59942626953125, -0.480712890625, -0.36199951171875, -0.2432861328125, -0.12457275390625, -0.005859375, 0.11285400390625, 0.2315673828125, 0.35028076171875, 0.468994140625, 0.58770751953125, 0.7064208984375, 0.82513427734375, 0.94384765625, 1.06256103515625, 1.1812744140625, 1.29998779296875, 1.418701171875, 1.53741455078125, 1.6561279296875, 1.77484130859375, 1.8935546875, 2.01226806640625, 2.1309814453125, 2.24969482421875, 2.368408203125, 2.48712158203125, 2.6058349609375, 2.72454833984375, 2.84326171875, 2.96197509765625, 3.0806884765625, 3.19940185546875, 3.318115234375, 3.43682861328125, 3.5555419921875, 3.67425537109375, 3.79296875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 7.0, 12.0, 12.0, 23.0, 38.0, 29.0, 36.0, 45.0, 43.0, 53.0, 52.0, 60.0, 62.0, 62.0, 63.0, 66.0, 58.0, 41.0, 42.0, 32.0, 30.0, 30.0, 29.0, 11.0, 20.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.4296875, -4.31591796875, -4.2021484375, -4.08837890625, -3.974609375, -3.86083984375, -3.7470703125, -3.63330078125, -3.51953125, -3.40576171875, -3.2919921875, -3.17822265625, -3.064453125, -2.95068359375, -2.8369140625, -2.72314453125, -2.609375, -2.49560546875, -2.3818359375, -2.26806640625, -2.154296875, -2.04052734375, -1.9267578125, -1.81298828125, -1.69921875, -1.58544921875, -1.4716796875, -1.35791015625, -1.244140625, -1.13037109375, -1.0166015625, -0.90283203125, -0.7890625, -0.67529296875, -0.5615234375, -0.44775390625, -0.333984375, -0.22021484375, -0.1064453125, 0.00732421875, 0.12109375, 0.23486328125, 0.3486328125, 0.46240234375, 0.576171875, 0.68994140625, 0.8037109375, 0.91748046875, 1.03125, 1.14501953125, 1.2587890625, 1.37255859375, 1.486328125, 1.60009765625, 1.7138671875, 1.82763671875, 1.94140625, 2.05517578125, 2.1689453125, 2.28271484375, 2.396484375, 2.51025390625, 2.6240234375, 2.73779296875, 2.8515625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 12.0, 12.0, 32.0, 39.0, 60.0, 117.0, 274.0, 783.0, 3179.0, 27585.0, 1230181.0, 2863241.0, 61169.0, 5464.0, 1252.0, 422.0, 188.0, 99.0, 53.0, 32.0, 21.0, 21.0, 12.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.26824951171875, -5.0404052734375, -4.81256103515625, -4.584716796875, -4.35687255859375, -4.1290283203125, -3.90118408203125, -3.67333984375, -3.44549560546875, -3.2176513671875, -2.98980712890625, -2.761962890625, -2.53411865234375, -2.3062744140625, -2.07843017578125, -1.8505859375, -1.62274169921875, -1.3948974609375, -1.16705322265625, -0.939208984375, -0.71136474609375, -0.4835205078125, -0.25567626953125, -0.02783203125, 0.20001220703125, 0.4278564453125, 0.65570068359375, 0.883544921875, 1.11138916015625, 1.3392333984375, 1.56707763671875, 1.794921875, 2.02276611328125, 2.2506103515625, 2.47845458984375, 2.706298828125, 2.93414306640625, 3.1619873046875, 3.38983154296875, 3.61767578125, 3.84552001953125, 4.0733642578125, 4.30120849609375, 4.529052734375, 4.75689697265625, 4.9847412109375, 5.21258544921875, 5.4404296875, 5.66827392578125, 5.8961181640625, 6.12396240234375, 6.351806640625, 6.57965087890625, 6.8074951171875, 7.03533935546875, 7.26318359375, 7.49102783203125, 7.7188720703125, 7.94671630859375, 8.174560546875, 8.40240478515625, 8.6302490234375, 8.85809326171875, 9.0859375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 6.0, 15.0, 26.0, 32.0, 71.0, 102.0, 163.0, 245.0, 425.0, 547.0, 685.0, 638.0, 450.0, 264.0, 144.0, 98.0, 56.0, 35.0, 19.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21484375, -2.15740966796875, -2.0999755859375, -2.04254150390625, -1.985107421875, -1.92767333984375, -1.8702392578125, -1.81280517578125, -1.75537109375, -1.69793701171875, -1.6405029296875, -1.58306884765625, -1.525634765625, -1.46820068359375, -1.4107666015625, -1.35333251953125, -1.2958984375, -1.23846435546875, -1.1810302734375, -1.12359619140625, -1.066162109375, -1.00872802734375, -0.9512939453125, -0.89385986328125, -0.83642578125, -0.77899169921875, -0.7215576171875, -0.66412353515625, -0.606689453125, -0.54925537109375, -0.4918212890625, -0.43438720703125, -0.376953125, -0.31951904296875, -0.2620849609375, -0.20465087890625, -0.147216796875, -0.08978271484375, -0.0323486328125, 0.02508544921875, 0.08251953125, 0.13995361328125, 0.1973876953125, 0.25482177734375, 0.312255859375, 0.36968994140625, 0.4271240234375, 0.48455810546875, 0.5419921875, 0.59942626953125, 0.6568603515625, 0.71429443359375, 0.771728515625, 0.82916259765625, 0.8865966796875, 0.94403076171875, 1.00146484375, 1.05889892578125, 1.1163330078125, 1.17376708984375, 1.231201171875, 1.28863525390625, 1.3460693359375, 1.40350341796875, 1.4609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 15.0, 18.0, 29.0, 58.0, 64.0, 77.0, 94.0, 108.0, 112.0, 113.0, 84.0, 72.0, 53.0, 39.0, 16.0, 15.0, 12.0, 8.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.956422805786133, -5.767917633056641, -5.579412460327148, -5.390907287597656, -5.202401638031006, -5.013896465301514, -4.8253912925720215, -4.636886119842529, -4.448380470275879, -4.259875297546387, -4.0713701248168945, -3.8828647136688232, -3.694359302520752, -3.5058541297912598, -3.3173489570617676, -3.1288437843322754, -2.940338611602783, -2.751833438873291, -2.5633280277252197, -2.3748228549957275, -2.1863174438476562, -1.997812271118164, -1.8093070983886719, -1.6208018064498901, -1.4322965145111084, -1.2437912225723267, -1.055285930633545, -0.8667807579040527, -0.678275465965271, -0.48977017402648926, -0.30126500129699707, -0.11275970935821533, 0.0757455825805664, 0.26425084471702576, 0.4527561068534851, 0.6412613391876221, 0.8297666311264038, 1.0182719230651855, 1.2067770957946777, 1.3952823877334595, 1.5837876796722412, 1.772292971611023, 1.9607982635498047, 2.149303436279297, 2.337808609008789, 2.5263140201568604, 2.7148191928863525, 2.903324604034424, 3.091829776763916, 3.280334949493408, 3.4688403606414795, 3.6573455333709717, 3.845850944519043, 4.034356117248535, 4.222861289978027, 4.4113664627075195, 4.599871635437012, 4.788376808166504, 4.976881980895996, 5.165387153625488, 5.353892803192139, 5.542397975921631, 5.730903148651123, 5.919408321380615, 6.107913970947266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 2.0, 16.0, 10.0, 16.0, 17.0, 15.0, 26.0, 29.0, 24.0, 28.0, 43.0, 44.0, 39.0, 48.0, 54.0, 49.0, 56.0, 59.0, 53.0, 49.0, 47.0, 43.0, 41.0, 42.0, 29.0, 29.0, 18.0, 15.0, 8.0, 9.0, 10.0, 4.0, 9.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.940107822418213, -2.830690383911133, -2.7212727069854736, -2.6118552684783936, -2.5024375915527344, -2.3930201530456543, -2.283602476119995, -2.174185037612915, -2.064767360687256, -1.9553498029708862, -1.8459322452545166, -1.736514687538147, -1.6270971298217773, -1.5176796913146973, -1.408262014389038, -1.298844575881958, -1.1894270181655884, -1.0800094604492188, -0.9705919027328491, -0.8611743450164795, -0.7517567873001099, -0.642339289188385, -0.5329217314720154, -0.42350417375564575, -0.3140866160392761, -0.2046690583229065, -0.09525151550769806, 0.014166027307510376, 0.12358358502388, 0.23300111293792725, 0.3424186706542969, 0.4518362283706665, 0.5612537860870361, 0.6706713438034058, 0.7800889015197754, 0.889506459236145, 0.9989240169525146, 1.1083414554595947, 1.217759132385254, 1.327176570892334, 1.4365942478179932, 1.5460118055343628, 1.6554293632507324, 1.764846920967102, 1.8742644786834717, 1.9836819171905518, 2.093099594116211, 2.202517032623291, 2.311934471130371, 2.421351909637451, 2.5307695865631104, 2.6401870250701904, 2.7496047019958496, 2.8590221405029297, 2.968439817428589, 3.077857255935669, 3.187274932861328, 3.296692371368408, 3.4061100482940674, 3.5155274868011475, 3.6249451637268066, 3.7343626022338867, 3.843780279159546, 3.953197717666626, 4.062615394592285]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 7.0, 4.0, 10.0, 19.0, 22.0, 34.0, 54.0, 73.0, 144.0, 191.0, 383.0, 735.0, 1536.0, 4113.0, 14228.0, 77519.0, 475158.0, 396329.0, 59595.0, 11853.0, 3564.0, 1467.0, 646.0, 339.0, 203.0, 119.0, 63.0, 40.0, 36.0, 16.0, 19.0, 12.0, 10.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89404296875, -0.8641738891601562, -0.8343048095703125, -0.8044357299804688, -0.774566650390625, -0.7446975708007812, -0.7148284912109375, -0.6849594116210938, -0.65509033203125, -0.6252212524414062, -0.5953521728515625, -0.5654830932617188, -0.535614013671875, -0.5057449340820312, -0.4758758544921875, -0.44600677490234375, -0.4161376953125, -0.38626861572265625, -0.3563995361328125, -0.32653045654296875, -0.296661376953125, -0.26679229736328125, -0.2369232177734375, -0.20705413818359375, -0.17718505859375, -0.14731597900390625, -0.1174468994140625, -0.08757781982421875, -0.057708740234375, -0.02783966064453125, 0.0020294189453125, 0.03189849853515625, 0.061767578125, 0.09163665771484375, 0.1215057373046875, 0.15137481689453125, 0.181243896484375, 0.21111297607421875, 0.2409820556640625, 0.27085113525390625, 0.30072021484375, 0.33058929443359375, 0.3604583740234375, 0.39032745361328125, 0.420196533203125, 0.45006561279296875, 0.4799346923828125, 0.5098037719726562, 0.5396728515625, 0.5695419311523438, 0.5994110107421875, 0.6292800903320312, 0.659149169921875, 0.6890182495117188, 0.7188873291015625, 0.7487564086914062, 0.77862548828125, 0.8084945678710938, 0.8383636474609375, 0.8682327270507812, 0.898101806640625, 0.9279708862304688, 0.9578399658203125, 0.9877090454101562, 1.017578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 6.0, 14.0, 13.0, 17.0, 17.0, 29.0, 23.0, 26.0, 40.0, 40.0, 55.0, 70.0, 55.0, 62.0, 69.0, 66.0, 48.0, 66.0, 56.0, 44.0, 33.0, 38.0, 25.0, 14.0, 17.0, 16.0, 7.0, 12.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.305694580078125, -2.22662353515625, -2.147552490234375, -2.0684814453125, -1.989410400390625, -1.91033935546875, -1.831268310546875, -1.752197265625, -1.673126220703125, -1.59405517578125, -1.514984130859375, -1.4359130859375, -1.356842041015625, -1.27777099609375, -1.198699951171875, -1.11962890625, -1.040557861328125, -0.96148681640625, -0.882415771484375, -0.8033447265625, -0.724273681640625, -0.64520263671875, -0.566131591796875, -0.487060546875, -0.407989501953125, -0.32891845703125, -0.249847412109375, -0.1707763671875, -0.091705322265625, -0.01263427734375, 0.066436767578125, 0.1455078125, 0.224578857421875, 0.30364990234375, 0.382720947265625, 0.4617919921875, 0.540863037109375, 0.61993408203125, 0.699005126953125, 0.778076171875, 0.857147216796875, 0.93621826171875, 1.015289306640625, 1.0943603515625, 1.173431396484375, 1.25250244140625, 1.331573486328125, 1.41064453125, 1.489715576171875, 1.56878662109375, 1.647857666015625, 1.7269287109375, 1.805999755859375, 1.88507080078125, 1.964141845703125, 2.043212890625, 2.122283935546875, 2.20135498046875, 2.280426025390625, 2.3594970703125, 2.438568115234375, 2.51763916015625, 2.596710205078125, 2.67578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 3.0, 16.0, 13.0, 20.0, 36.0, 43.0, 64.0, 85.0, 134.0, 186.0, 292.0, 449.0, 660.0, 1018.0, 1697.0, 2762.0, 4760.0, 8155.0, 14503.0, 25756.0, 46362.0, 80455.0, 133482.0, 186912.0, 193619.0, 142246.0, 87785.0, 50552.0, 28363.0, 15705.0, 9046.0, 5199.0, 3043.0, 1774.0, 1157.0, 724.0, 474.0, 314.0, 196.0, 148.0, 93.0, 69.0, 50.0, 42.0, 28.0, 19.0, 18.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1903076171875, -0.1835308074951172, -0.17675399780273438, -0.16997718811035156, -0.16320037841796875, -0.15642356872558594, -0.14964675903320312, -0.1428699493408203, -0.1360931396484375, -0.1293163299560547, -0.12253952026367188, -0.11576271057128906, -0.10898590087890625, -0.10220909118652344, -0.09543228149414062, -0.08865547180175781, -0.081878662109375, -0.07510185241699219, -0.06832504272460938, -0.06154823303222656, -0.05477142333984375, -0.04799461364746094, -0.041217803955078125, -0.03444099426269531, -0.0276641845703125, -0.020887374877929688, -0.014110565185546875, -0.0073337554931640625, -0.00055694580078125, 0.0062198638916015625, 0.012996673583984375, 0.019773483276367188, 0.02655029296875, 0.03332710266113281, 0.040103912353515625, 0.04688072204589844, 0.05365753173828125, 0.06043434143066406, 0.06721115112304688, 0.07398796081542969, 0.0807647705078125, 0.08754158020019531, 0.09431838989257812, 0.10109519958496094, 0.10787200927734375, 0.11464881896972656, 0.12142562866210938, 0.1282024383544922, 0.134979248046875, 0.1417560577392578, 0.14853286743164062, 0.15530967712402344, 0.16208648681640625, 0.16886329650878906, 0.17564010620117188, 0.1824169158935547, 0.1891937255859375, 0.1959705352783203, 0.20274734497070312, 0.20952415466308594, 0.21630096435546875, 0.22307777404785156, 0.22985458374023438, 0.2366313934326172, 0.243408203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 3.0, 7.0, 13.0, 13.0, 8.0, 22.0, 24.0, 25.0, 36.0, 34.0, 55.0, 52.0, 48.0, 45.0, 49.0, 57.0, 52.0, 46.0, 61.0, 61.0, 39.0, 46.0, 30.0, 38.0, 21.0, 24.0, 19.0, 13.0, 11.0, 15.0, 12.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.3895263671875, -3.259521484375, -3.1295166015625, -2.99951171875, -2.8695068359375, -2.739501953125, -2.6094970703125, -2.4794921875, -2.3494873046875, -2.219482421875, -2.0894775390625, -1.95947265625, -1.8294677734375, -1.699462890625, -1.5694580078125, -1.439453125, -1.3094482421875, -1.179443359375, -1.0494384765625, -0.91943359375, -0.7894287109375, -0.659423828125, -0.5294189453125, -0.3994140625, -0.2694091796875, -0.139404296875, -0.0093994140625, 0.12060546875, 0.2506103515625, 0.380615234375, 0.5106201171875, 0.640625, 0.7706298828125, 0.900634765625, 1.0306396484375, 1.16064453125, 1.2906494140625, 1.420654296875, 1.5506591796875, 1.6806640625, 1.8106689453125, 1.940673828125, 2.0706787109375, 2.20068359375, 2.3306884765625, 2.460693359375, 2.5906982421875, 2.720703125, 2.8507080078125, 2.980712890625, 3.1107177734375, 3.24072265625, 3.3707275390625, 3.500732421875, 3.6307373046875, 3.7607421875, 3.8907470703125, 4.020751953125, 4.1507568359375, 4.28076171875, 4.4107666015625, 4.540771484375, 4.6707763671875, 4.80078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 8.0, 2.0, 8.0, 17.0, 17.0, 22.0, 34.0, 53.0, 74.0, 101.0, 128.0, 241.0, 444.0, 1074.0, 2435.0, 7301.0, 25680.0, 109352.0, 388913.0, 373767.0, 103080.0, 24270.0, 6992.0, 2409.0, 970.0, 462.0, 246.0, 156.0, 95.0, 58.0, 35.0, 30.0, 30.0, 11.0, 11.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053436279296875, -0.051592350006103516, -0.04974842071533203, -0.04790449142456055, -0.04606056213378906, -0.04421663284301758, -0.042372703552246094, -0.04052877426147461, -0.038684844970703125, -0.03684091567993164, -0.034996986389160156, -0.03315305709838867, -0.03130912780761719, -0.029465198516845703, -0.02762126922607422, -0.025777339935302734, -0.02393341064453125, -0.022089481353759766, -0.02024555206298828, -0.018401622772216797, -0.016557693481445312, -0.014713764190673828, -0.012869834899902344, -0.01102590560913086, -0.009181976318359375, -0.007338047027587891, -0.005494117736816406, -0.003650188446044922, -0.0018062591552734375, 3.7670135498046875e-05, 0.0018815994262695312, 0.0037255287170410156, 0.0055694580078125, 0.007413387298583984, 0.009257316589355469, 0.011101245880126953, 0.012945175170898438, 0.014789104461669922, 0.016633033752441406, 0.01847696304321289, 0.020320892333984375, 0.02216482162475586, 0.024008750915527344, 0.025852680206298828, 0.027696609497070312, 0.029540538787841797, 0.03138446807861328, 0.033228397369384766, 0.03507232666015625, 0.036916255950927734, 0.03876018524169922, 0.0406041145324707, 0.04244804382324219, 0.04429197311401367, 0.046135902404785156, 0.04797983169555664, 0.049823760986328125, 0.05166769027709961, 0.053511619567871094, 0.05535554885864258, 0.05719947814941406, 0.05904340744018555, 0.06088733673095703, 0.06273126602172852, 0.0645751953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 6.0, 6.0, 14.0, 13.0, 16.0, 19.0, 33.0, 28.0, 33.0, 59.0, 51.0, 79.0, 74.0, 79.0, 96.0, 76.0, 69.0, 55.0, 38.0, 37.0, 27.0, 23.0, 10.0, 13.0, 8.0, 8.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8564205169677734e-05, -3.7445686757564545e-05, -3.6327168345451355e-05, -3.5208649933338165e-05, -3.4090131521224976e-05, -3.2971613109111786e-05, -3.1853094696998596e-05, -3.0734576284885406e-05, -2.9616057872772217e-05, -2.8497539460659027e-05, -2.7379021048545837e-05, -2.6260502636432648e-05, -2.5141984224319458e-05, -2.402346581220627e-05, -2.290494740009308e-05, -2.178642898797989e-05, -2.06679105758667e-05, -1.954939216375351e-05, -1.843087375164032e-05, -1.731235533952713e-05, -1.619383692741394e-05, -1.507531851530075e-05, -1.3956800103187561e-05, -1.2838281691074371e-05, -1.1719763278961182e-05, -1.0601244866847992e-05, -9.482726454734802e-06, -8.364208042621613e-06, -7.245689630508423e-06, -6.127171218395233e-06, -5.0086528062820435e-06, -3.890134394168854e-06, -2.771615982055664e-06, -1.6530975699424744e-06, -5.345791578292847e-07, 5.83939254283905e-07, 1.7024576663970947e-06, 2.8209760785102844e-06, 3.939494490623474e-06, 5.058012902736664e-06, 6.1765313148498535e-06, 7.295049726963043e-06, 8.413568139076233e-06, 9.532086551189423e-06, 1.0650604963302612e-05, 1.1769123375415802e-05, 1.2887641787528992e-05, 1.4006160199642181e-05, 1.5124678611755371e-05, 1.624319702386856e-05, 1.736171543598175e-05, 1.848023384809494e-05, 1.959875226020813e-05, 2.071727067232132e-05, 2.183578908443451e-05, 2.29543074965477e-05, 2.407282590866089e-05, 2.519134432077408e-05, 2.6309862732887268e-05, 2.7428381145000458e-05, 2.8546899557113647e-05, 2.9665417969226837e-05, 3.078393638134003e-05, 3.1902454793453217e-05, 3.3020973205566406e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 7.0, 8.0, 9.0, 26.0, 15.0, 46.0, 73.0, 121.0, 301.0, 567.0, 1286.0, 3625.0, 12683.0, 51074.0, 218736.0, 473928.0, 217270.0, 50340.0, 12302.0, 3627.0, 1362.0, 550.0, 266.0, 137.0, 66.0, 36.0, 18.0, 24.0, 7.0, 11.0, 4.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053253173828125, -0.05138444900512695, -0.049515724182128906, -0.04764699935913086, -0.04577827453613281, -0.043909549713134766, -0.04204082489013672, -0.04017210006713867, -0.038303375244140625, -0.03643465042114258, -0.03456592559814453, -0.032697200775146484, -0.030828475952148438, -0.02895975112915039, -0.027091026306152344, -0.025222301483154297, -0.02335357666015625, -0.021484851837158203, -0.019616127014160156, -0.01774740219116211, -0.015878677368164062, -0.014009952545166016, -0.012141227722167969, -0.010272502899169922, -0.008403778076171875, -0.006535053253173828, -0.004666328430175781, -0.0027976036071777344, -0.0009288787841796875, 0.0009398460388183594, 0.0028085708618164062, 0.004677295684814453, 0.0065460205078125, 0.008414745330810547, 0.010283470153808594, 0.01215219497680664, 0.014020919799804688, 0.015889644622802734, 0.01775836944580078, 0.019627094268798828, 0.021495819091796875, 0.023364543914794922, 0.02523326873779297, 0.027101993560791016, 0.028970718383789062, 0.03083944320678711, 0.032708168029785156, 0.0345768928527832, 0.03644561767578125, 0.0383143424987793, 0.040183067321777344, 0.04205179214477539, 0.04392051696777344, 0.045789241790771484, 0.04765796661376953, 0.04952669143676758, 0.051395416259765625, 0.05326414108276367, 0.05513286590576172, 0.057001590728759766, 0.05887031555175781, 0.06073904037475586, 0.0626077651977539, 0.06447649002075195, 0.06634521484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 13.0, 15.0, 17.0, 29.0, 49.0, 41.0, 71.0, 78.0, 130.0, 110.0, 94.0, 75.0, 69.0, 55.0, 41.0, 30.0, 27.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020660400390625, -0.019962310791015625, -0.01926422119140625, -0.018566131591796875, -0.0178680419921875, -0.017169952392578125, -0.01647186279296875, -0.015773773193359375, -0.01507568359375, -0.014377593994140625, -0.01367950439453125, -0.012981414794921875, -0.0122833251953125, -0.011585235595703125, -0.01088714599609375, -0.010189056396484375, -0.009490966796875, -0.008792877197265625, -0.00809478759765625, -0.007396697998046875, -0.0066986083984375, -0.006000518798828125, -0.00530242919921875, -0.004604339599609375, -0.00390625, -0.003208160400390625, -0.00251007080078125, -0.001811981201171875, -0.0011138916015625, -0.000415802001953125, 0.00028228759765625, 0.000980377197265625, 0.001678466796875, 0.002376556396484375, 0.00307464599609375, 0.003772735595703125, 0.0044708251953125, 0.005168914794921875, 0.00586700439453125, 0.006565093994140625, 0.00726318359375, 0.007961273193359375, 0.00865936279296875, 0.009357452392578125, 0.0100555419921875, 0.010753631591796875, 0.01145172119140625, 0.012149810791015625, 0.012847900390625, 0.013545989990234375, 0.01424407958984375, 0.014942169189453125, 0.0156402587890625, 0.016338348388671875, 0.01703643798828125, 0.017734527587890625, 0.0184326171875, 0.019130706787109375, 0.01982879638671875, 0.020526885986328125, 0.0212249755859375, 0.021923065185546875, 0.02262115478515625, 0.023319244384765625, 0.024017333984375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 13.0, 50.0, 180.0, 310.0, 290.0, 115.0, 41.0, 8.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.463403701782227, -4.141867637634277, -3.820331573486328, -3.498795509338379, -3.1772594451904297, -2.8557233810424805, -2.5341875553131104, -2.212651491165161, -1.891115427017212, -1.5695793628692627, -1.2480432987213135, -0.9265073537826538, -0.6049712896347046, -0.28343522548675537, 0.0381007194519043, 0.3596367835998535, 0.6811728477478027, 1.002708911895752, 1.3242449760437012, 1.6457809209823608, 1.96731698513031, 2.288853168487549, 2.610388994216919, 2.931925058364868, 3.2534611225128174, 3.5749971866607666, 3.896533250808716, 4.218069076538086, 4.539605140686035, 4.861141204833984, 5.182677268981934, 5.504213333129883, 5.825749397277832, 6.147285461425781, 6.4688215255737305, 6.79035758972168, 7.111893653869629, 7.433429718017578, 7.754965782165527, 8.076501846313477, 8.398037910461426, 8.719573974609375, 9.041110038757324, 9.362646102905273, 9.684182167053223, 10.005718231201172, 10.327254295349121, 10.64879035949707, 10.970325469970703, 11.291861534118652, 11.613397598266602, 11.93493366241455, 12.2564697265625, 12.57800579071045, 12.899541854858398, 13.221077919006348, 13.542613983154297, 13.864150047302246, 14.185686111450195, 14.507222175598145, 14.828758239746094, 15.150294303894043, 15.471830368041992, 15.793366432189941, 16.11490249633789]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 18.0, 22.0, 19.0, 30.0, 34.0, 26.0, 48.0, 53.0, 49.0, 52.0, 67.0, 75.0, 68.0, 70.0, 66.0, 46.0, 56.0, 48.0, 34.0, 31.0, 16.0, 11.0, 11.0, 7.0, 6.0, 12.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314805507659912, -2.233933687210083, -2.153061866760254, -2.072190046310425, -1.9913182258605957, -1.9104464054107666, -1.829574704170227, -1.748702883720398, -1.6678310632705688, -1.5869592428207397, -1.5060874223709106, -1.4252156019210815, -1.344343900680542, -1.263472080230713, -1.1826002597808838, -1.1017284393310547, -1.0208566188812256, -0.9399847984313965, -0.8591129779815674, -0.7782412171363831, -0.697369396686554, -0.6164975762367249, -0.5356258153915405, -0.4547539949417114, -0.3738821744918823, -0.2930103540420532, -0.2121385633945465, -0.1312667578458786, -0.05039495229721069, 0.030476868152618408, 0.11134865880012512, 0.19222044944763184, 0.27309250831604004, 0.35396432876586914, 0.43483611941337585, 0.5157079100608826, 0.5965797305107117, 0.6774515509605408, 0.7583233118057251, 0.8391951322555542, 0.9200669527053833, 1.0009387731552124, 1.0818105936050415, 1.1626824140548706, 1.2435541152954102, 1.3244259357452393, 1.4052977561950684, 1.4861695766448975, 1.5670413970947266, 1.6479132175445557, 1.7287850379943848, 1.8096568584442139, 1.890528678894043, 1.971400499343872, 2.052272319793701, 2.133143901824951, 2.2140159606933594, 2.2948877811431885, 2.3757596015930176, 2.4566314220428467, 2.537503242492676, 2.618375062942505, 2.699246883392334, 2.780118465423584, 2.860990285873413]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 14.0, 11.0, 35.0, 29.0, 64.0, 86.0, 162.0, 301.0, 536.0, 1066.0, 2165.0, 4576.0, 10290.0, 24902.0, 58125.0, 132819.0, 246826.0, 272102.0, 163721.0, 74689.0, 31584.0, 13204.0, 5693.0, 2639.0, 1374.0, 668.0, 369.0, 180.0, 115.0, 73.0, 38.0, 34.0, 11.0, 17.0, 8.0, 2.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.861328125, -1.8098297119140625, -1.758331298828125, -1.7068328857421875, -1.65533447265625, -1.6038360595703125, -1.552337646484375, -1.5008392333984375, -1.4493408203125, -1.3978424072265625, -1.346343994140625, -1.2948455810546875, -1.24334716796875, -1.1918487548828125, -1.140350341796875, -1.0888519287109375, -1.037353515625, -0.9858551025390625, -0.934356689453125, -0.8828582763671875, -0.83135986328125, -0.7798614501953125, -0.728363037109375, -0.6768646240234375, -0.6253662109375, -0.5738677978515625, -0.522369384765625, -0.4708709716796875, -0.41937255859375, -0.3678741455078125, -0.316375732421875, -0.2648773193359375, -0.21337890625, -0.1618804931640625, -0.110382080078125, -0.0588836669921875, -0.00738525390625, 0.0441131591796875, 0.095611572265625, 0.1471099853515625, 0.1986083984375, 0.2501068115234375, 0.301605224609375, 0.3531036376953125, 0.40460205078125, 0.4561004638671875, 0.507598876953125, 0.5590972900390625, 0.610595703125, 0.6620941162109375, 0.713592529296875, 0.7650909423828125, 0.81658935546875, 0.8680877685546875, 0.919586181640625, 0.9710845947265625, 1.0225830078125, 1.0740814208984375, 1.125579833984375, 1.1770782470703125, 1.22857666015625, 1.2800750732421875, 1.331573486328125, 1.3830718994140625, 1.4345703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 19.0, 16.0, 21.0, 25.0, 30.0, 43.0, 51.0, 47.0, 48.0, 58.0, 83.0, 70.0, 70.0, 68.0, 50.0, 68.0, 55.0, 34.0, 33.0, 20.0, 20.0, 8.0, 9.0, 8.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.83984375, -3.6943359375, -3.548828125, -3.4033203125, -3.2578125, -3.1123046875, -2.966796875, -2.8212890625, -2.67578125, -2.5302734375, -2.384765625, -2.2392578125, -2.09375, -1.9482421875, -1.802734375, -1.6572265625, -1.51171875, -1.3662109375, -1.220703125, -1.0751953125, -0.9296875, -0.7841796875, -0.638671875, -0.4931640625, -0.34765625, -0.2021484375, -0.056640625, 0.0888671875, 0.234375, 0.3798828125, 0.525390625, 0.6708984375, 0.81640625, 0.9619140625, 1.107421875, 1.2529296875, 1.3984375, 1.5439453125, 1.689453125, 1.8349609375, 1.98046875, 2.1259765625, 2.271484375, 2.4169921875, 2.5625, 2.7080078125, 2.853515625, 2.9990234375, 3.14453125, 3.2900390625, 3.435546875, 3.5810546875, 3.7265625, 3.8720703125, 4.017578125, 4.1630859375, 4.30859375, 4.4541015625, 4.599609375, 4.7451171875, 4.890625, 5.0361328125, 5.181640625, 5.3271484375, 5.47265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 7.0, 10.0, 6.0, 5.0, 12.0, 14.0, 22.0, 23.0, 29.0, 23.0, 39.0, 39.0, 47.0, 73.0, 126.0, 210.0, 466.0, 3136.0, 277323.0, 755188.0, 10210.0, 700.0, 255.0, 138.0, 90.0, 51.0, 46.0, 31.0, 41.0, 21.0, 18.0, 14.0, 20.0, 16.0, 22.0, 9.0, 11.0, 6.0, 3.0, 6.0, 3.0, 4.0, 5.0, 2.0, 8.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.890625, -8.6141357421875, -8.337646484375, -8.0611572265625, -7.78466796875, -7.5081787109375, -7.231689453125, -6.9552001953125, -6.6787109375, -6.4022216796875, -6.125732421875, -5.8492431640625, -5.57275390625, -5.2962646484375, -5.019775390625, -4.7432861328125, -4.466796875, -4.1903076171875, -3.913818359375, -3.6373291015625, -3.36083984375, -3.0843505859375, -2.807861328125, -2.5313720703125, -2.2548828125, -1.9783935546875, -1.701904296875, -1.4254150390625, -1.14892578125, -0.8724365234375, -0.595947265625, -0.3194580078125, -0.04296875, 0.2335205078125, 0.510009765625, 0.7864990234375, 1.06298828125, 1.3394775390625, 1.615966796875, 1.8924560546875, 2.1689453125, 2.4454345703125, 2.721923828125, 2.9984130859375, 3.27490234375, 3.5513916015625, 3.827880859375, 4.1043701171875, 4.380859375, 4.6573486328125, 4.933837890625, 5.2103271484375, 5.48681640625, 5.7633056640625, 6.039794921875, 6.3162841796875, 6.5927734375, 6.8692626953125, 7.145751953125, 7.4222412109375, 7.69873046875, 7.9752197265625, 8.251708984375, 8.5281982421875, 8.8046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 9.0, 8.0, 9.0, 10.0, 13.0, 20.0, 20.0, 24.0, 25.0, 21.0, 21.0, 38.0, 41.0, 43.0, 33.0, 35.0, 41.0, 43.0, 46.0, 47.0, 44.0, 36.0, 33.0, 35.0, 34.0, 30.0, 39.0, 35.0, 31.0, 19.0, 16.0, 17.0, 12.0, 13.0, 11.0, 7.0, 4.0, 6.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.36328125, -3.25921630859375, -3.1551513671875, -3.05108642578125, -2.947021484375, -2.84295654296875, -2.7388916015625, -2.63482666015625, -2.53076171875, -2.42669677734375, -2.3226318359375, -2.21856689453125, -2.114501953125, -2.01043701171875, -1.9063720703125, -1.80230712890625, -1.6982421875, -1.59417724609375, -1.4901123046875, -1.38604736328125, -1.281982421875, -1.17791748046875, -1.0738525390625, -0.96978759765625, -0.86572265625, -0.76165771484375, -0.6575927734375, -0.55352783203125, -0.449462890625, -0.34539794921875, -0.2413330078125, -0.13726806640625, -0.033203125, 0.07086181640625, 0.1749267578125, 0.27899169921875, 0.383056640625, 0.48712158203125, 0.5911865234375, 0.69525146484375, 0.79931640625, 0.90338134765625, 1.0074462890625, 1.11151123046875, 1.215576171875, 1.31964111328125, 1.4237060546875, 1.52777099609375, 1.6318359375, 1.73590087890625, 1.8399658203125, 1.94403076171875, 2.048095703125, 2.15216064453125, 2.2562255859375, 2.36029052734375, 2.46435546875, 2.56842041015625, 2.6724853515625, 2.77655029296875, 2.880615234375, 2.98468017578125, 3.0887451171875, 3.19281005859375, 3.296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 5.0, 8.0, 17.0, 45.0, 81.0, 190.0, 601.0, 2565.0, 27000.0, 860918.0, 149886.0, 5636.0, 1020.0, 297.0, 124.0, 68.0, 34.0, 6.0, 7.0, 8.0, 11.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.77734375, -2.6949462890625, -2.612548828125, -2.5301513671875, -2.44775390625, -2.3653564453125, -2.282958984375, -2.2005615234375, -2.1181640625, -2.0357666015625, -1.953369140625, -1.8709716796875, -1.78857421875, -1.7061767578125, -1.623779296875, -1.5413818359375, -1.458984375, -1.3765869140625, -1.294189453125, -1.2117919921875, -1.12939453125, -1.0469970703125, -0.964599609375, -0.8822021484375, -0.7998046875, -0.7174072265625, -0.635009765625, -0.5526123046875, -0.47021484375, -0.3878173828125, -0.305419921875, -0.2230224609375, -0.140625, -0.0582275390625, 0.024169921875, 0.1065673828125, 0.18896484375, 0.2713623046875, 0.353759765625, 0.4361572265625, 0.5185546875, 0.6009521484375, 0.683349609375, 0.7657470703125, 0.84814453125, 0.9305419921875, 1.012939453125, 1.0953369140625, 1.177734375, 1.2601318359375, 1.342529296875, 1.4249267578125, 1.50732421875, 1.5897216796875, 1.672119140625, 1.7545166015625, 1.8369140625, 1.9193115234375, 2.001708984375, 2.0841064453125, 2.16650390625, 2.2489013671875, 2.331298828125, 2.4136962890625, 2.49609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 4.0, 9.0, 4.0, 10.0, 10.0, 19.0, 25.0, 42.0, 52.0, 64.0, 94.0, 93.0, 107.0, 109.0, 90.0, 83.0, 51.0, 35.0, 19.0, 23.0, 14.0, 16.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017917156219482422, -0.0001738760620355606, -0.000168580561876297, -0.00016328506171703339, -0.00015798956155776978, -0.00015269406139850616, -0.00014739856123924255, -0.00014210306107997894, -0.00013680756092071533, -0.00013151206076145172, -0.0001262165606021881, -0.0001209210604429245, -0.00011562556028366089, -0.00011033006012439728, -0.00010503455996513367, -9.973905980587006e-05, -9.444355964660645e-05, -8.914805948734283e-05, -8.385255932807922e-05, -7.855705916881561e-05, -7.3261559009552e-05, -6.796605885028839e-05, -6.267055869102478e-05, -5.737505853176117e-05, -5.207955837249756e-05, -4.678405821323395e-05, -4.148855805397034e-05, -3.6193057894706726e-05, -3.0897557735443115e-05, -2.5602057576179504e-05, -2.0306557416915894e-05, -1.5011057257652283e-05, -9.715557098388672e-06, -4.420056939125061e-06, 8.754432201385498e-07, 6.170943379402161e-06, 1.1466443538665771e-05, 1.6761943697929382e-05, 2.2057443857192993e-05, 2.7352944016456604e-05, 3.2648444175720215e-05, 3.7943944334983826e-05, 4.3239444494247437e-05, 4.853494465351105e-05, 5.383044481277466e-05, 5.912594497203827e-05, 6.442144513130188e-05, 6.971694529056549e-05, 7.50124454498291e-05, 8.030794560909271e-05, 8.560344576835632e-05, 9.089894592761993e-05, 9.619444608688354e-05, 0.00010148994624614716, 0.00010678544640541077, 0.00011208094656467438, 0.00011737644672393799, 0.0001226719468832016, 0.0001279674470424652, 0.00013326294720172882, 0.00013855844736099243, 0.00014385394752025604, 0.00014914944767951965, 0.00015444494783878326, 0.00015974044799804688]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 13.0, 15.0, 28.0, 53.0, 112.0, 370.0, 1513.0, 16266.0, 620850.0, 397202.0, 10267.0, 1271.0, 346.0, 98.0, 51.0, 31.0, 13.0, 5.0, 11.0, 3.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.63671875, -2.558990478515625, -2.48126220703125, -2.403533935546875, -2.3258056640625, -2.248077392578125, -2.17034912109375, -2.092620849609375, -2.014892578125, -1.937164306640625, -1.85943603515625, -1.781707763671875, -1.7039794921875, -1.626251220703125, -1.54852294921875, -1.470794677734375, -1.39306640625, -1.315338134765625, -1.23760986328125, -1.159881591796875, -1.0821533203125, -1.004425048828125, -0.92669677734375, -0.848968505859375, -0.771240234375, -0.693511962890625, -0.61578369140625, -0.538055419921875, -0.4603271484375, -0.382598876953125, -0.30487060546875, -0.227142333984375, -0.1494140625, -0.071685791015625, 0.00604248046875, 0.083770751953125, 0.1614990234375, 0.239227294921875, 0.31695556640625, 0.394683837890625, 0.472412109375, 0.550140380859375, 0.62786865234375, 0.705596923828125, 0.7833251953125, 0.861053466796875, 0.93878173828125, 1.016510009765625, 1.09423828125, 1.171966552734375, 1.24969482421875, 1.327423095703125, 1.4051513671875, 1.482879638671875, 1.56060791015625, 1.638336181640625, 1.716064453125, 1.793792724609375, 1.87152099609375, 1.949249267578125, 2.0269775390625, 2.104705810546875, 2.18243408203125, 2.260162353515625, 2.337890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 8.0, 17.0, 23.0, 21.0, 40.0, 62.0, 64.0, 87.0, 106.0, 107.0, 118.0, 84.0, 72.0, 50.0, 44.0, 27.0, 20.0, 10.0, 6.0, 5.0, 11.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.59912109375, -0.5812911987304688, -0.5634613037109375, -0.5456314086914062, -0.527801513671875, -0.5099716186523438, -0.4921417236328125, -0.47431182861328125, -0.45648193359375, -0.43865203857421875, -0.4208221435546875, -0.40299224853515625, -0.385162353515625, -0.36733245849609375, -0.3495025634765625, -0.33167266845703125, -0.3138427734375, -0.29601287841796875, -0.2781829833984375, -0.26035308837890625, -0.242523193359375, -0.22469329833984375, -0.2068634033203125, -0.18903350830078125, -0.17120361328125, -0.15337371826171875, -0.1355438232421875, -0.11771392822265625, -0.099884033203125, -0.08205413818359375, -0.0642242431640625, -0.04639434814453125, -0.028564453125, -0.01073455810546875, 0.0070953369140625, 0.02492523193359375, 0.042755126953125, 0.06058502197265625, 0.0784149169921875, 0.09624481201171875, 0.11407470703125, 0.13190460205078125, 0.1497344970703125, 0.16756439208984375, 0.185394287109375, 0.20322418212890625, 0.2210540771484375, 0.23888397216796875, 0.2567138671875, 0.27454376220703125, 0.2923736572265625, 0.31020355224609375, 0.328033447265625, 0.34586334228515625, 0.3636932373046875, 0.38152313232421875, 0.39935302734375, 0.41718292236328125, 0.4350128173828125, 0.45284271240234375, 0.470672607421875, 0.48850250244140625, 0.5063323974609375, 0.5241622924804688, 0.5419921875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 25.0, 59.0, 144.0, 200.0, 206.0, 162.0, 110.0, 50.0, 22.0, 13.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-21.55654525756836, -21.14507293701172, -20.733600616455078, -20.322128295898438, -19.910655975341797, -19.499183654785156, -19.087711334228516, -18.676237106323242, -18.2647647857666, -17.85329246520996, -17.44182014465332, -17.03034782409668, -16.61887550354004, -16.207401275634766, -15.795929908752441, -15.3844575881958, -14.97298526763916, -14.56151294708252, -14.150040626525879, -13.738567352294922, -13.327095031738281, -12.91562271118164, -12.504150390625, -12.09267807006836, -11.681205749511719, -11.269733428955078, -10.858261108398438, -10.446788787841797, -10.03531551361084, -9.6238431930542, -9.212370872497559, -8.800898551940918, -8.389424324035645, -7.977952003479004, -7.566479206085205, -7.1550068855285645, -6.743534088134766, -6.332061767578125, -5.920589447021484, -5.509117126464844, -5.097644329071045, -4.686172008514404, -4.2746992111206055, -3.863226890563965, -3.451754331588745, -3.0402817726135254, -2.6288094520568848, -2.217336893081665, -1.8058643341064453, -1.3943917751312256, -0.9829193353652954, -0.5714468955993652, -0.1599743366241455, 0.2514982223510742, 0.6629705429077148, 1.0744431018829346, 1.4859156608581543, 1.897388219833374, 2.3088607788085938, 2.7203330993652344, 3.131805658340454, 3.543278217315674, 3.9547505378723145, 4.366223335266113, 4.777695655822754]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 10.0, 12.0, 13.0, 19.0, 29.0, 18.0, 19.0, 22.0, 40.0, 26.0, 40.0, 49.0, 40.0, 49.0, 47.0, 47.0, 54.0, 57.0, 51.0, 49.0, 37.0, 46.0, 30.0, 40.0, 31.0, 29.0, 13.0, 19.0, 15.0, 15.0, 4.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.909377098083496, -5.702003479003906, -5.494629859924316, -5.287256240844727, -5.079882621765137, -4.872509002685547, -4.665135383605957, -4.457761764526367, -4.250388145446777, -4.0430145263671875, -3.8356409072875977, -3.628267288208008, -3.420893669128418, -3.213520050048828, -3.0061464309692383, -2.7987728118896484, -2.5913991928100586, -2.3840255737304688, -2.176651954650879, -1.969278335571289, -1.7619047164916992, -1.5545310974121094, -1.3471574783325195, -1.1397838592529297, -0.9324102401733398, -0.72503662109375, -0.5176630020141602, -0.3102893829345703, -0.10291576385498047, 0.10445785522460938, 0.3118314743041992, 0.5192050933837891, 0.7265787124633789, 0.9339523315429688, 1.1413259506225586, 1.3486995697021484, 1.5560731887817383, 1.7634468078613281, 1.970820426940918, 2.178194046020508, 2.3855676651000977, 2.5929412841796875, 2.8003149032592773, 3.007688522338867, 3.215062141418457, 3.422435760498047, 3.6298093795776367, 3.8371829986572266, 4.044556617736816, 4.251930236816406, 4.459303855895996, 4.666677474975586, 4.874051094055176, 5.081424713134766, 5.2887983322143555, 5.496171951293945, 5.703545570373535, 5.910919189453125, 6.118292808532715, 6.325666427612305, 6.5330400466918945, 6.740413665771484, 6.947787284851074, 7.155160903930664, 7.362534523010254]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 16.0, 19.0, 35.0, 35.0, 42.0, 93.0, 138.0, 203.0, 354.0, 741.0, 2088.0, 12797.0, 205403.0, 2714576.0, 1195646.0, 55574.0, 4755.0, 963.0, 316.0, 180.0, 89.0, 64.0, 41.0, 32.0, 23.0, 14.0, 17.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.8740234375, -5.669921875, -5.4658203125, -5.26171875, -5.0576171875, -4.853515625, -4.6494140625, -4.4453125, -4.2412109375, -4.037109375, -3.8330078125, -3.62890625, -3.4248046875, -3.220703125, -3.0166015625, -2.8125, -2.6083984375, -2.404296875, -2.2001953125, -1.99609375, -1.7919921875, -1.587890625, -1.3837890625, -1.1796875, -0.9755859375, -0.771484375, -0.5673828125, -0.36328125, -0.1591796875, 0.044921875, 0.2490234375, 0.453125, 0.6572265625, 0.861328125, 1.0654296875, 1.26953125, 1.4736328125, 1.677734375, 1.8818359375, 2.0859375, 2.2900390625, 2.494140625, 2.6982421875, 2.90234375, 3.1064453125, 3.310546875, 3.5146484375, 3.71875, 3.9228515625, 4.126953125, 4.3310546875, 4.53515625, 4.7392578125, 4.943359375, 5.1474609375, 5.3515625, 5.5556640625, 5.759765625, 5.9638671875, 6.16796875, 6.3720703125, 6.576171875, 6.7802734375, 6.984375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 6.0, 11.0, 8.0, 6.0, 6.0, 11.0, 21.0, 23.0, 28.0, 29.0, 34.0, 44.0, 29.0, 56.0, 60.0, 47.0, 49.0, 55.0, 55.0, 60.0, 56.0, 41.0, 45.0, 52.0, 28.0, 36.0, 21.0, 20.0, 17.0, 9.0, 12.0, 5.0, 8.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.219879150390625, -2.12530517578125, -2.030731201171875, -1.9361572265625, -1.841583251953125, -1.74700927734375, -1.652435302734375, -1.557861328125, -1.463287353515625, -1.36871337890625, -1.274139404296875, -1.1795654296875, -1.084991455078125, -0.99041748046875, -0.895843505859375, -0.80126953125, -0.706695556640625, -0.61212158203125, -0.517547607421875, -0.4229736328125, -0.328399658203125, -0.23382568359375, -0.139251708984375, -0.044677734375, 0.049896240234375, 0.14447021484375, 0.239044189453125, 0.3336181640625, 0.428192138671875, 0.52276611328125, 0.617340087890625, 0.7119140625, 0.806488037109375, 0.90106201171875, 0.995635986328125, 1.0902099609375, 1.184783935546875, 1.27935791015625, 1.373931884765625, 1.468505859375, 1.563079833984375, 1.65765380859375, 1.752227783203125, 1.8468017578125, 1.941375732421875, 2.03594970703125, 2.130523681640625, 2.22509765625, 2.319671630859375, 2.41424560546875, 2.508819580078125, 2.6033935546875, 2.697967529296875, 2.79254150390625, 2.887115478515625, 2.981689453125, 3.076263427734375, 3.17083740234375, 3.265411376953125, 3.3599853515625, 3.454559326171875, 3.54913330078125, 3.643707275390625, 3.73828125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 19.0, 25.0, 90.0, 451.0, 7932.0, 4143228.0, 41581.0, 722.0, 172.0, 44.0, 20.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.625, -26.04150390625, -25.4580078125, -24.87451171875, -24.291015625, -23.70751953125, -23.1240234375, -22.54052734375, -21.95703125, -21.37353515625, -20.7900390625, -20.20654296875, -19.623046875, -19.03955078125, -18.4560546875, -17.87255859375, -17.2890625, -16.70556640625, -16.1220703125, -15.53857421875, -14.955078125, -14.37158203125, -13.7880859375, -13.20458984375, -12.62109375, -12.03759765625, -11.4541015625, -10.87060546875, -10.287109375, -9.70361328125, -9.1201171875, -8.53662109375, -7.953125, -7.36962890625, -6.7861328125, -6.20263671875, -5.619140625, -5.03564453125, -4.4521484375, -3.86865234375, -3.28515625, -2.70166015625, -2.1181640625, -1.53466796875, -0.951171875, -0.36767578125, 0.2158203125, 0.79931640625, 1.3828125, 1.96630859375, 2.5498046875, 3.13330078125, 3.716796875, 4.30029296875, 4.8837890625, 5.46728515625, 6.05078125, 6.63427734375, 7.2177734375, 7.80126953125, 8.384765625, 8.96826171875, 9.5517578125, 10.13525390625, 10.71875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 4.0, 10.0, 12.0, 19.0, 18.0, 30.0, 56.0, 103.0, 152.0, 267.0, 384.0, 498.0, 641.0, 624.0, 467.0, 297.0, 182.0, 121.0, 83.0, 45.0, 19.0, 13.0, 8.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3638763427734375, -1.314666748046875, -1.2654571533203125, -1.21624755859375, -1.1670379638671875, -1.117828369140625, -1.0686187744140625, -1.0194091796875, -0.9701995849609375, -0.920989990234375, -0.8717803955078125, -0.82257080078125, -0.7733612060546875, -0.724151611328125, -0.6749420166015625, -0.625732421875, -0.5765228271484375, -0.527313232421875, -0.4781036376953125, -0.42889404296875, -0.3796844482421875, -0.330474853515625, -0.2812652587890625, -0.2320556640625, -0.1828460693359375, -0.133636474609375, -0.0844268798828125, -0.03521728515625, 0.0139923095703125, 0.063201904296875, 0.1124114990234375, 0.16162109375, 0.2108306884765625, 0.260040283203125, 0.3092498779296875, 0.35845947265625, 0.4076690673828125, 0.456878662109375, 0.5060882568359375, 0.5552978515625, 0.6045074462890625, 0.653717041015625, 0.7029266357421875, 0.75213623046875, 0.8013458251953125, 0.850555419921875, 0.8997650146484375, 0.948974609375, 0.9981842041015625, 1.047393798828125, 1.0966033935546875, 1.14581298828125, 1.1950225830078125, 1.244232177734375, 1.2934417724609375, 1.3426513671875, 1.3918609619140625, 1.441070556640625, 1.4902801513671875, 1.53948974609375, 1.5886993408203125, 1.637908935546875, 1.6871185302734375, 1.736328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 15.0, 30.0, 37.0, 44.0, 71.0, 112.0, 132.0, 129.0, 128.0, 108.0, 61.0, 48.0, 34.0, 20.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.638984680175781, -6.447938442230225, -6.256892204284668, -6.065845966339111, -5.874799728393555, -5.683753967285156, -5.492707252502441, -5.301661491394043, -5.110615253448486, -4.91956901550293, -4.728522777557373, -4.537476539611816, -4.34643030166626, -4.155384063720703, -3.9643380641937256, -3.773292064666748, -3.5822455883026123, -3.3911993503570557, -3.200153112411499, -3.0091071128845215, -2.818060874938965, -2.627014636993408, -2.4359683990478516, -2.244922161102295, -2.0538759231567383, -1.8628296852111816, -1.6717835664749146, -1.480737328529358, -1.2896912097930908, -1.0986449718475342, -0.9075987339019775, -0.7165526151657104, -0.5255064964294434, -0.3344603180885315, -0.14341410994529724, 0.04763209819793701, 0.23867827653884888, 0.42972445487976074, 0.6207706928253174, 0.8118168115615845, 1.0028630495071411, 1.1939092874526978, 1.3849554061889648, 1.5760016441345215, 1.7670478820800781, 1.9580940008163452, 2.1491403579711914, 2.340186357498169, 2.5312325954437256, 2.7222788333892822, 2.913325071334839, 3.1043710708618164, 3.295417308807373, 3.4864635467529297, 3.6775097846984863, 3.868556022644043, 4.0596022605896, 4.250648498535156, 4.441694736480713, 4.6327409744262695, 4.823787212371826, 5.014833450317383, 5.205879211425781, 5.396925449371338, 5.5879716873168945]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 5.0, 8.0, 5.0, 12.0, 10.0, 14.0, 19.0, 17.0, 16.0, 17.0, 18.0, 30.0, 31.0, 29.0, 36.0, 29.0, 41.0, 46.0, 42.0, 44.0, 48.0, 43.0, 55.0, 41.0, 36.0, 29.0, 28.0, 26.0, 33.0, 28.0, 25.0, 14.0, 16.0, 19.0, 21.0, 11.0, 12.0, 8.0, 2.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.3792097568511963, -2.297116279602051, -2.2150228023529053, -2.1329293251037598, -2.050835609436035, -1.9687422513961792, -1.8866486549377441, -1.8045551776885986, -1.7224617004394531, -1.6403682231903076, -1.558274745941162, -1.476181149482727, -1.3940876722335815, -1.311994194984436, -1.229900598526001, -1.1478071212768555, -1.06571364402771, -0.9836201667785645, -0.9015266299247742, -0.8194330930709839, -0.7373396158218384, -0.6552461385726929, -0.5731526017189026, -0.4910590648651123, -0.4089655876159668, -0.3268720805644989, -0.244778573513031, -0.1626850664615631, -0.08059155941009521, 0.0015019476413726807, 0.08359545469284058, 0.16568899154663086, 0.24778223037719727, 0.32987573742866516, 0.41196924448013306, 0.49406275153160095, 0.5761562585830688, 0.6582497358322144, 0.7403432726860046, 0.8224368095397949, 0.9045302867889404, 0.9866237640380859, 1.0687172412872314, 1.1508108377456665, 1.232904314994812, 1.3149977922439575, 1.3970913887023926, 1.479184865951538, 1.5612783432006836, 1.643371820449829, 1.7254652976989746, 1.8075588941574097, 1.8896523714065552, 1.9717458486557007, 2.0538394451141357, 2.1359329223632812, 2.2180263996124268, 2.3001198768615723, 2.3822133541107178, 2.4643068313598633, 2.546400547027588, 2.6284940242767334, 2.710587501525879, 2.7926809787750244, 2.87477445602417]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 16.0, 17.0, 21.0, 27.0, 50.0, 101.0, 195.0, 405.0, 1106.0, 4169.0, 23243.0, 195751.0, 664484.0, 136735.0, 17254.0, 3337.0, 934.0, 337.0, 149.0, 93.0, 53.0, 40.0, 18.0, 12.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.8653717041015625, -0.831329345703125, -0.7972869873046875, -0.76324462890625, -0.7292022705078125, -0.695159912109375, -0.6611175537109375, -0.6270751953125, -0.5930328369140625, -0.558990478515625, -0.5249481201171875, -0.49090576171875, -0.4568634033203125, -0.422821044921875, -0.3887786865234375, -0.354736328125, -0.3206939697265625, -0.286651611328125, -0.2526092529296875, -0.21856689453125, -0.1845245361328125, -0.150482177734375, -0.1164398193359375, -0.0823974609375, -0.0483551025390625, -0.014312744140625, 0.0197296142578125, 0.05377197265625, 0.0878143310546875, 0.121856689453125, 0.1558990478515625, 0.18994140625, 0.2239837646484375, 0.258026123046875, 0.2920684814453125, 0.32611083984375, 0.3601531982421875, 0.394195556640625, 0.4282379150390625, 0.4622802734375, 0.4963226318359375, 0.530364990234375, 0.5644073486328125, 0.59844970703125, 0.6324920654296875, 0.666534423828125, 0.7005767822265625, 0.734619140625, 0.7686614990234375, 0.802703857421875, 0.8367462158203125, 0.87078857421875, 0.9048309326171875, 0.938873291015625, 0.9729156494140625, 1.0069580078125, 1.0410003662109375, 1.075042724609375, 1.1090850830078125, 1.14312744140625, 1.1771697998046875, 1.211212158203125, 1.2452545166015625, 1.279296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 6.0, 11.0, 10.0, 20.0, 26.0, 41.0, 28.0, 51.0, 76.0, 94.0, 81.0, 99.0, 86.0, 81.0, 53.0, 56.0, 59.0, 39.0, 19.0, 21.0, 20.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.382080078125, -2.27197265625, -2.161865234375, -2.0517578125, -1.941650390625, -1.83154296875, -1.721435546875, -1.611328125, -1.501220703125, -1.39111328125, -1.281005859375, -1.1708984375, -1.060791015625, -0.95068359375, -0.840576171875, -0.73046875, -0.620361328125, -0.51025390625, -0.400146484375, -0.2900390625, -0.179931640625, -0.06982421875, 0.040283203125, 0.150390625, 0.260498046875, 0.37060546875, 0.480712890625, 0.5908203125, 0.700927734375, 0.81103515625, 0.921142578125, 1.03125, 1.141357421875, 1.25146484375, 1.361572265625, 1.4716796875, 1.581787109375, 1.69189453125, 1.802001953125, 1.912109375, 2.022216796875, 2.13232421875, 2.242431640625, 2.3525390625, 2.462646484375, 2.57275390625, 2.682861328125, 2.79296875, 2.903076171875, 3.01318359375, 3.123291015625, 3.2333984375, 3.343505859375, 3.45361328125, 3.563720703125, 3.673828125, 3.783935546875, 3.89404296875, 4.004150390625, 4.1142578125, 4.224365234375, 4.33447265625, 4.444580078125, 4.5546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 9.0, 17.0, 17.0, 23.0, 47.0, 59.0, 91.0, 159.0, 227.0, 336.0, 544.0, 875.0, 1424.0, 2359.0, 3934.0, 6678.0, 11350.0, 19652.0, 33386.0, 55729.0, 89925.0, 135190.0, 171917.0, 169557.0, 129964.0, 85821.0, 53160.0, 31153.0, 18252.0, 10731.0, 6353.0, 3797.0, 2148.0, 1312.0, 801.0, 558.0, 328.0, 223.0, 146.0, 104.0, 60.0, 32.0, 33.0, 16.0, 14.0, 8.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.1851482391357422, -0.17852401733398438, -0.17189979553222656, -0.16527557373046875, -0.15865135192871094, -0.15202713012695312, -0.1454029083251953, -0.1387786865234375, -0.1321544647216797, -0.12553024291992188, -0.11890602111816406, -0.11228179931640625, -0.10565757751464844, -0.09903335571289062, -0.09240913391113281, -0.085784912109375, -0.07916069030761719, -0.07253646850585938, -0.06591224670410156, -0.05928802490234375, -0.05266380310058594, -0.046039581298828125, -0.03941535949707031, -0.0327911376953125, -0.026166915893554688, -0.019542694091796875, -0.012918472290039062, -0.00629425048828125, 0.0003299713134765625, 0.006954193115234375, 0.013578414916992188, 0.02020263671875, 0.026826858520507812, 0.033451080322265625, 0.04007530212402344, 0.04669952392578125, 0.05332374572753906, 0.059947967529296875, 0.06657218933105469, 0.0731964111328125, 0.07982063293457031, 0.08644485473632812, 0.09306907653808594, 0.09969329833984375, 0.10631752014160156, 0.11294174194335938, 0.11956596374511719, 0.126190185546875, 0.1328144073486328, 0.13943862915039062, 0.14606285095214844, 0.15268707275390625, 0.15931129455566406, 0.16593551635742188, 0.1725597381591797, 0.1791839599609375, 0.1858081817626953, 0.19243240356445312, 0.19905662536621094, 0.20568084716796875, 0.21230506896972656, 0.21892929077148438, 0.2255535125732422, 0.232177734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 13.0, 16.0, 17.0, 18.0, 25.0, 20.0, 39.0, 40.0, 37.0, 48.0, 24.0, 63.0, 64.0, 50.0, 44.0, 51.0, 48.0, 43.0, 37.0, 36.0, 31.0, 40.0, 29.0, 37.0, 26.0, 18.0, 13.0, 19.0, 11.0, 8.0, 8.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.432220458984375, -3.30389404296875, -3.175567626953125, -3.0472412109375, -2.918914794921875, -2.79058837890625, -2.662261962890625, -2.533935546875, -2.405609130859375, -2.27728271484375, -2.148956298828125, -2.0206298828125, -1.892303466796875, -1.76397705078125, -1.635650634765625, -1.50732421875, -1.378997802734375, -1.25067138671875, -1.122344970703125, -0.9940185546875, -0.865692138671875, -0.73736572265625, -0.609039306640625, -0.480712890625, -0.352386474609375, -0.22406005859375, -0.095733642578125, 0.0325927734375, 0.160919189453125, 0.28924560546875, 0.417572021484375, 0.5458984375, 0.674224853515625, 0.80255126953125, 0.930877685546875, 1.0592041015625, 1.187530517578125, 1.31585693359375, 1.444183349609375, 1.572509765625, 1.700836181640625, 1.82916259765625, 1.957489013671875, 2.0858154296875, 2.214141845703125, 2.34246826171875, 2.470794677734375, 2.59912109375, 2.727447509765625, 2.85577392578125, 2.984100341796875, 3.1124267578125, 3.240753173828125, 3.36907958984375, 3.497406005859375, 3.625732421875, 3.754058837890625, 3.88238525390625, 4.010711669921875, 4.1390380859375, 4.267364501953125, 4.39569091796875, 4.524017333984375, 4.65234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 17.0, 10.0, 21.0, 33.0, 44.0, 68.0, 92.0, 144.0, 202.0, 348.0, 514.0, 823.0, 1532.0, 2727.0, 5752.0, 13316.0, 34658.0, 96051.0, 236832.0, 335797.0, 195295.0, 75481.0, 27537.0, 10753.0, 4782.0, 2311.0, 1251.0, 780.0, 456.0, 266.0, 195.0, 136.0, 106.0, 73.0, 32.0, 23.0, 18.0, 13.0, 16.0, 10.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04296875, -0.0416417121887207, -0.040314674377441406, -0.03898763656616211, -0.03766059875488281, -0.036333560943603516, -0.03500652313232422, -0.03367948532104492, -0.032352447509765625, -0.031025409698486328, -0.02969837188720703, -0.028371334075927734, -0.027044296264648438, -0.02571725845336914, -0.024390220642089844, -0.023063182830810547, -0.02173614501953125, -0.020409107208251953, -0.019082069396972656, -0.01775503158569336, -0.016427993774414062, -0.015100955963134766, -0.013773918151855469, -0.012446880340576172, -0.011119842529296875, -0.009792804718017578, -0.008465766906738281, -0.007138729095458984, -0.0058116912841796875, -0.004484653472900391, -0.0031576156616210938, -0.0018305778503417969, -0.0005035400390625, 0.0008234977722167969, 0.0021505355834960938, 0.0034775733947753906, 0.0048046112060546875, 0.006131649017333984, 0.007458686828613281, 0.008785724639892578, 0.010112762451171875, 0.011439800262451172, 0.012766838073730469, 0.014093875885009766, 0.015420913696289062, 0.01674795150756836, 0.018074989318847656, 0.019402027130126953, 0.02072906494140625, 0.022056102752685547, 0.023383140563964844, 0.02471017837524414, 0.026037216186523438, 0.027364253997802734, 0.02869129180908203, 0.030018329620361328, 0.031345367431640625, 0.03267240524291992, 0.03399944305419922, 0.035326480865478516, 0.03665351867675781, 0.03798055648803711, 0.039307594299316406, 0.0406346321105957, 0.041961669921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 12.0, 6.0, 12.0, 12.0, 26.0, 22.0, 24.0, 35.0, 45.0, 44.0, 53.0, 54.0, 63.0, 74.0, 75.0, 71.0, 68.0, 45.0, 39.0, 48.0, 24.0, 32.0, 22.0, 18.0, 8.0, 13.0, 11.0, 10.0, 3.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361701965332031e-05, -3.2568350434303284e-05, -3.1519681215286255e-05, -3.0471011996269226e-05, -2.9422342777252197e-05, -2.837367355823517e-05, -2.732500433921814e-05, -2.627633512020111e-05, -2.5227665901184082e-05, -2.4178996682167053e-05, -2.3130327463150024e-05, -2.2081658244132996e-05, -2.1032989025115967e-05, -1.9984319806098938e-05, -1.893565058708191e-05, -1.788698136806488e-05, -1.683831214904785e-05, -1.5789642930030823e-05, -1.4740973711013794e-05, -1.3692304491996765e-05, -1.2643635272979736e-05, -1.1594966053962708e-05, -1.0546296834945679e-05, -9.49762761592865e-06, -8.448958396911621e-06, -7.400289177894592e-06, -6.3516199588775635e-06, -5.302950739860535e-06, -4.254281520843506e-06, -3.205612301826477e-06, -2.1569430828094482e-06, -1.1082738637924194e-06, -5.960464477539063e-08, 9.890645742416382e-07, 2.037733793258667e-06, 3.086403012275696e-06, 4.135072231292725e-06, 5.183741450309753e-06, 6.232410669326782e-06, 7.281079888343811e-06, 8.32974910736084e-06, 9.378418326377869e-06, 1.0427087545394897e-05, 1.1475756764411926e-05, 1.2524425983428955e-05, 1.3573095202445984e-05, 1.4621764421463013e-05, 1.567043364048004e-05, 1.671910285949707e-05, 1.77677720785141e-05, 1.8816441297531128e-05, 1.9865110516548157e-05, 2.0913779735565186e-05, 2.1962448954582214e-05, 2.3011118173599243e-05, 2.4059787392616272e-05, 2.51084566116333e-05, 2.615712583065033e-05, 2.720579504966736e-05, 2.8254464268684387e-05, 2.9303133487701416e-05, 3.0351802706718445e-05, 3.1400471925735474e-05, 3.24491411447525e-05, 3.349781036376953e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 14.0, 14.0, 19.0, 29.0, 46.0, 82.0, 156.0, 291.0, 565.0, 1480.0, 4565.0, 16836.0, 79714.0, 367949.0, 438856.0, 107131.0, 21833.0, 5687.0, 1787.0, 732.0, 328.0, 169.0, 90.0, 58.0, 33.0, 23.0, 8.0, 10.0, 10.0, 6.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06640625, -0.06427001953125, -0.0621337890625, -0.05999755859375, -0.057861328125, -0.05572509765625, -0.0535888671875, -0.05145263671875, -0.04931640625, -0.04718017578125, -0.0450439453125, -0.04290771484375, -0.040771484375, -0.03863525390625, -0.0364990234375, -0.03436279296875, -0.0322265625, -0.03009033203125, -0.0279541015625, -0.02581787109375, -0.023681640625, -0.02154541015625, -0.0194091796875, -0.01727294921875, -0.01513671875, -0.01300048828125, -0.0108642578125, -0.00872802734375, -0.006591796875, -0.00445556640625, -0.0023193359375, -0.00018310546875, 0.001953125, 0.00408935546875, 0.0062255859375, 0.00836181640625, 0.010498046875, 0.01263427734375, 0.0147705078125, 0.01690673828125, 0.01904296875, 0.02117919921875, 0.0233154296875, 0.02545166015625, 0.027587890625, 0.02972412109375, 0.0318603515625, 0.03399658203125, 0.0361328125, 0.03826904296875, 0.0404052734375, 0.04254150390625, 0.044677734375, 0.04681396484375, 0.0489501953125, 0.05108642578125, 0.05322265625, 0.05535888671875, 0.0574951171875, 0.05963134765625, 0.061767578125, 0.06390380859375, 0.0660400390625, 0.06817626953125, 0.0703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 3.0, 1.0, 8.0, 8.0, 11.0, 24.0, 15.0, 22.0, 32.0, 45.0, 59.0, 70.0, 88.0, 82.0, 77.0, 90.0, 70.0, 70.0, 47.0, 35.0, 28.0, 27.0, 18.0, 14.0, 9.0, 5.0, 6.0, 4.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01763916015625, -0.017047643661499023, -0.016456127166748047, -0.01586461067199707, -0.015273094177246094, -0.014681577682495117, -0.01409006118774414, -0.013498544692993164, -0.012907028198242188, -0.012315511703491211, -0.011723995208740234, -0.011132478713989258, -0.010540962219238281, -0.009949445724487305, -0.009357929229736328, -0.008766412734985352, -0.008174896240234375, -0.0075833797454833984, -0.006991863250732422, -0.006400346755981445, -0.005808830261230469, -0.005217313766479492, -0.004625797271728516, -0.004034280776977539, -0.0034427642822265625, -0.002851247787475586, -0.0022597312927246094, -0.0016682147979736328, -0.0010766983032226562, -0.0004851818084716797, 0.00010633468627929688, 0.0006978511810302734, 0.00128936767578125, 0.0018808841705322266, 0.002472400665283203, 0.0030639171600341797, 0.0036554336547851562, 0.004246950149536133, 0.004838466644287109, 0.005429983139038086, 0.0060214996337890625, 0.006613016128540039, 0.007204532623291016, 0.007796049118041992, 0.008387565612792969, 0.008979082107543945, 0.009570598602294922, 0.010162115097045898, 0.010753631591796875, 0.011345148086547852, 0.011936664581298828, 0.012528181076049805, 0.013119697570800781, 0.013711214065551758, 0.014302730560302734, 0.014894247055053711, 0.015485763549804688, 0.016077280044555664, 0.01666879653930664, 0.017260313034057617, 0.017851829528808594, 0.01844334602355957, 0.019034862518310547, 0.019626379013061523, 0.0202178955078125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 16.0, 113.0, 363.0, 373.0, 115.0, 20.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.987186431884766, -8.596941947937012, -8.206696510314941, -7.8164520263671875, -7.426207542419434, -7.0359625816345215, -6.645717620849609, -6.2554731369018555, -5.865228176116943, -5.474983215332031, -5.084738731384277, -4.694493770599365, -4.304248809814453, -3.914004325866699, -3.523759365081787, -3.133514642715454, -2.743269920349121, -2.353025197982788, -1.9627803564071655, -1.572535514831543, -1.18229079246521, -0.792046070098877, -0.40180110931396484, -0.011556386947631836, 0.37868833541870117, 0.768933117389679, 1.1591778993606567, 1.5494227409362793, 1.9396674633026123, 2.3299121856689453, 2.7201571464538574, 3.1104018688201904, 3.5006465911865234, 3.8908913135528564, 4.2811360359191895, 4.671380996704102, 5.0616254806518555, 5.451870441436768, 5.84211540222168, 6.232359886169434, 6.622604846954346, 7.012849807739258, 7.403094291687012, 7.793339252471924, 8.183584213256836, 8.57382869720459, 8.964073181152344, 9.354318618774414, 9.744563102722168, 10.134807586669922, 10.525053024291992, 10.915297508239746, 11.3055419921875, 11.69578742980957, 12.086031913757324, 12.476276397705078, 12.866521835327148, 13.256766319274902, 13.647011756896973, 14.037256240844727, 14.42750072479248, 14.817745208740234, 15.207990646362305, 15.598235130310059, 15.988479614257812]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 1.0, 7.0, 4.0, 4.0, 12.0, 15.0, 17.0, 24.0, 31.0, 23.0, 42.0, 49.0, 45.0, 56.0, 77.0, 67.0, 68.0, 75.0, 65.0, 47.0, 47.0, 45.0, 38.0, 37.0, 22.0, 19.0, 18.0, 16.0, 3.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.84909725189209, -2.7684621810913086, -2.6878268718719482, -2.607191801071167, -2.5265567302703857, -2.4459214210510254, -2.365286350250244, -2.284651279449463, -2.2040159702301025, -2.1233808994293213, -2.042745590209961, -1.9621105194091797, -1.8814753293991089, -1.800840139389038, -1.7202050685882568, -1.639569878578186, -1.5589348077774048, -1.478299617767334, -1.3976645469665527, -1.317029356956482, -1.2363941669464111, -1.1557590961456299, -1.075123906135559, -0.9944887161254883, -0.9138535857200623, -0.8332184553146362, -0.7525832653045654, -0.6719481348991394, -0.5913130044937134, -0.5106778144836426, -0.43004268407821655, -0.34940749406814575, -0.2687723636627197, -0.1881372034549713, -0.1075020581483841, -0.026866912841796875, 0.05376824736595154, 0.13440340757369995, 0.21503853797912598, 0.2956737279891968, 0.3763088583946228, 0.4569440186023712, 0.5375791788101196, 0.6182143092155457, 0.6988494396209717, 0.7794846296310425, 0.8601197600364685, 0.9407549500465393, 1.0213900804519653, 1.1020252704620361, 1.1826603412628174, 1.2632955312728882, 1.343930721282959, 1.4245657920837402, 1.505200982093811, 1.5858361721038818, 1.666471242904663, 1.7471064329147339, 1.8277415037155151, 1.908376693725586, 1.9890118837356567, 2.0696470737457275, 2.150282144546509, 2.230917453765869, 2.3115525245666504]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 6.0, 9.0, 5.0, 11.0, 14.0, 10.0, 20.0, 16.0, 32.0, 46.0, 69.0, 121.0, 476.0, 4473.0, 73933.0, 705773.0, 247476.0, 14392.0, 1107.0, 202.0, 82.0, 60.0, 49.0, 32.0, 22.0, 20.0, 14.0, 12.0, 11.0, 8.0, 4.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.11328125, -5.9205322265625, -5.727783203125, -5.5350341796875, -5.34228515625, -5.1495361328125, -4.956787109375, -4.7640380859375, -4.5712890625, -4.3785400390625, -4.185791015625, -3.9930419921875, -3.80029296875, -3.6075439453125, -3.414794921875, -3.2220458984375, -3.029296875, -2.8365478515625, -2.643798828125, -2.4510498046875, -2.25830078125, -2.0655517578125, -1.872802734375, -1.6800537109375, -1.4873046875, -1.2945556640625, -1.101806640625, -0.9090576171875, -0.71630859375, -0.5235595703125, -0.330810546875, -0.1380615234375, 0.0546875, 0.2474365234375, 0.440185546875, 0.6329345703125, 0.82568359375, 1.0184326171875, 1.211181640625, 1.4039306640625, 1.5966796875, 1.7894287109375, 1.982177734375, 2.1749267578125, 2.36767578125, 2.5604248046875, 2.753173828125, 2.9459228515625, 3.138671875, 3.3314208984375, 3.524169921875, 3.7169189453125, 3.90966796875, 4.1024169921875, 4.295166015625, 4.4879150390625, 4.6806640625, 4.8734130859375, 5.066162109375, 5.2589111328125, 5.45166015625, 5.6444091796875, 5.837158203125, 6.0299072265625, 6.22265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 16.0, 20.0, 57.0, 67.0, 107.0, 164.0, 163.0, 152.0, 92.0, 79.0, 41.0, 24.0, 8.0, 8.0, 5.0, 1.0, 0.0, 2.0], "bins": [-17.25, -16.920684814453125, -16.59136962890625, -16.262054443359375, -15.9327392578125, -15.603424072265625, -15.27410888671875, -14.944793701171875, -14.615478515625, -14.286163330078125, -13.95684814453125, -13.627532958984375, -13.2982177734375, -12.968902587890625, -12.63958740234375, -12.310272216796875, -11.98095703125, -11.651641845703125, -11.32232666015625, -10.993011474609375, -10.6636962890625, -10.334381103515625, -10.00506591796875, -9.675750732421875, -9.346435546875, -9.017120361328125, -8.68780517578125, -8.358489990234375, -8.0291748046875, -7.699859619140625, -7.37054443359375, -7.041229248046875, -6.7119140625, -6.382598876953125, -6.05328369140625, -5.723968505859375, -5.3946533203125, -5.065338134765625, -4.73602294921875, -4.406707763671875, -4.077392578125, -3.748077392578125, -3.41876220703125, -3.089447021484375, -2.7601318359375, -2.430816650390625, -2.10150146484375, -1.772186279296875, -1.44287109375, -1.113555908203125, -0.78424072265625, -0.454925537109375, -0.1256103515625, 0.203704833984375, 0.53302001953125, 0.862335205078125, 1.191650390625, 1.520965576171875, 1.85028076171875, 2.179595947265625, 2.5089111328125, 2.838226318359375, 3.16754150390625, 3.496856689453125, 3.826171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 12.0, 28.0, 29.0, 40.0, 47.0, 76.0, 103.0, 95.0, 128.0, 159.0, 248.0, 382.0, 1045.0, 10683.0, 260721.0, 721425.0, 49149.0, 2541.0, 528.0, 271.0, 209.0, 157.0, 122.0, 98.0, 68.0, 61.0, 38.0, 24.0, 21.0, 13.0, 6.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.80413818359375, -5.6121826171875, -5.42022705078125, -5.228271484375, -5.03631591796875, -4.8443603515625, -4.65240478515625, -4.46044921875, -4.26849365234375, -4.0765380859375, -3.88458251953125, -3.692626953125, -3.50067138671875, -3.3087158203125, -3.11676025390625, -2.9248046875, -2.73284912109375, -2.5408935546875, -2.34893798828125, -2.156982421875, -1.96502685546875, -1.7730712890625, -1.58111572265625, -1.38916015625, -1.19720458984375, -1.0052490234375, -0.81329345703125, -0.621337890625, -0.42938232421875, -0.2374267578125, -0.04547119140625, 0.146484375, 0.33843994140625, 0.5303955078125, 0.72235107421875, 0.914306640625, 1.10626220703125, 1.2982177734375, 1.49017333984375, 1.68212890625, 1.87408447265625, 2.0660400390625, 2.25799560546875, 2.449951171875, 2.64190673828125, 2.8338623046875, 3.02581787109375, 3.2177734375, 3.40972900390625, 3.6016845703125, 3.79364013671875, 3.985595703125, 4.17755126953125, 4.3695068359375, 4.56146240234375, 4.75341796875, 4.94537353515625, 5.1373291015625, 5.32928466796875, 5.521240234375, 5.71319580078125, 5.9051513671875, 6.09710693359375, 6.2890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 14.0, 12.0, 23.0, 29.0, 35.0, 27.0, 32.0, 41.0, 42.0, 34.0, 44.0, 43.0, 46.0, 37.0, 51.0, 61.0, 50.0, 57.0, 41.0, 35.0, 24.0, 37.0, 39.0, 23.0, 19.0, 16.0, 12.0, 16.0, 6.0, 4.0, 2.0, 5.0, 6.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.2265625, -4.112762451171875, -3.99896240234375, -3.885162353515625, -3.7713623046875, -3.657562255859375, -3.54376220703125, -3.429962158203125, -3.316162109375, -3.202362060546875, -3.08856201171875, -2.974761962890625, -2.8609619140625, -2.747161865234375, -2.63336181640625, -2.519561767578125, -2.40576171875, -2.291961669921875, -2.17816162109375, -2.064361572265625, -1.9505615234375, -1.836761474609375, -1.72296142578125, -1.609161376953125, -1.495361328125, -1.381561279296875, -1.26776123046875, -1.153961181640625, -1.0401611328125, -0.926361083984375, -0.81256103515625, -0.698760986328125, -0.5849609375, -0.471160888671875, -0.35736083984375, -0.243560791015625, -0.1297607421875, -0.015960693359375, 0.09783935546875, 0.211639404296875, 0.325439453125, 0.439239501953125, 0.55303955078125, 0.666839599609375, 0.7806396484375, 0.894439697265625, 1.00823974609375, 1.122039794921875, 1.23583984375, 1.349639892578125, 1.46343994140625, 1.577239990234375, 1.6910400390625, 1.804840087890625, 1.91864013671875, 2.032440185546875, 2.146240234375, 2.260040283203125, 2.37384033203125, 2.487640380859375, 2.6014404296875, 2.715240478515625, 2.82904052734375, 2.942840576171875, 3.056640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 5.0, 9.0, 17.0, 25.0, 29.0, 87.0, 145.0, 425.0, 1713.0, 11048.0, 384600.0, 631699.0, 15569.0, 2266.0, 514.0, 165.0, 72.0, 46.0, 22.0, 10.0, 13.0, 14.0, 10.0, 0.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.98046875, -2.884552001953125, -2.78863525390625, -2.692718505859375, -2.5968017578125, -2.500885009765625, -2.40496826171875, -2.309051513671875, -2.213134765625, -2.117218017578125, -2.02130126953125, -1.925384521484375, -1.8294677734375, -1.733551025390625, -1.63763427734375, -1.541717529296875, -1.44580078125, -1.349884033203125, -1.25396728515625, -1.158050537109375, -1.0621337890625, -0.966217041015625, -0.87030029296875, -0.774383544921875, -0.678466796875, -0.582550048828125, -0.48663330078125, -0.390716552734375, -0.2947998046875, -0.198883056640625, -0.10296630859375, -0.007049560546875, 0.0888671875, 0.184783935546875, 0.28070068359375, 0.376617431640625, 0.4725341796875, 0.568450927734375, 0.66436767578125, 0.760284423828125, 0.856201171875, 0.952117919921875, 1.04803466796875, 1.143951416015625, 1.2398681640625, 1.335784912109375, 1.43170166015625, 1.527618408203125, 1.62353515625, 1.719451904296875, 1.81536865234375, 1.911285400390625, 2.0072021484375, 2.103118896484375, 2.19903564453125, 2.294952392578125, 2.390869140625, 2.486785888671875, 2.58270263671875, 2.678619384765625, 2.7745361328125, 2.870452880859375, 2.96636962890625, 3.062286376953125, 3.158203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 3.0, 21.0, 18.0, 24.0, 28.0, 35.0, 68.0, 76.0, 91.0, 96.0, 98.0, 87.0, 83.0, 58.0, 60.0, 32.0, 24.0, 27.0, 14.0, 10.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021398067474365234, -0.0002077445387840271, -0.00020150840282440186, -0.0001952722668647766, -0.00018903613090515137, -0.00018279999494552612, -0.00017656385898590088, -0.00017032772302627563, -0.0001640915870666504, -0.00015785545110702515, -0.0001516193151473999, -0.00014538317918777466, -0.00013914704322814941, -0.00013291090726852417, -0.00012667477130889893, -0.00012043863534927368, -0.00011420249938964844, -0.0001079663634300232, -0.00010173022747039795, -9.54940915107727e-05, -8.925795555114746e-05, -8.302181959152222e-05, -7.678568363189697e-05, -7.054954767227173e-05, -6.431341171264648e-05, -5.807727575302124e-05, -5.1841139793395996e-05, -4.560500383377075e-05, -3.936886787414551e-05, -3.3132731914520264e-05, -2.689659595489502e-05, -2.0660459995269775e-05, -1.4424324035644531e-05, -8.188188076019287e-06, -1.952052116394043e-06, 4.284083843231201e-06, 1.0520219802856445e-05, 1.675635576248169e-05, 2.2992491722106934e-05, 2.9228627681732178e-05, 3.546476364135742e-05, 4.1700899600982666e-05, 4.793703556060791e-05, 5.4173171520233154e-05, 6.04093074798584e-05, 6.664544343948364e-05, 7.288157939910889e-05, 7.911771535873413e-05, 8.535385131835938e-05, 9.158998727798462e-05, 9.782612323760986e-05, 0.00010406225919723511, 0.00011029839515686035, 0.0001165345311164856, 0.00012277066707611084, 0.00012900680303573608, 0.00013524293899536133, 0.00014147907495498657, 0.00014771521091461182, 0.00015395134687423706, 0.0001601874828338623, 0.00016642361879348755, 0.0001726597547531128, 0.00017889589071273804, 0.00018513202667236328]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 5.0, 11.0, 13.0, 17.0, 29.0, 49.0, 70.0, 175.0, 442.0, 2333.0, 31065.0, 917374.0, 91851.0, 3989.0, 675.0, 207.0, 99.0, 45.0, 20.0, 18.0, 6.0, 16.0, 6.0, 3.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.39453125, -3.287200927734375, -3.17987060546875, -3.072540283203125, -2.9652099609375, -2.857879638671875, -2.75054931640625, -2.643218994140625, -2.535888671875, -2.428558349609375, -2.32122802734375, -2.213897705078125, -2.1065673828125, -1.999237060546875, -1.89190673828125, -1.784576416015625, -1.67724609375, -1.569915771484375, -1.46258544921875, -1.355255126953125, -1.2479248046875, -1.140594482421875, -1.03326416015625, -0.925933837890625, -0.818603515625, -0.711273193359375, -0.60394287109375, -0.496612548828125, -0.3892822265625, -0.281951904296875, -0.17462158203125, -0.067291259765625, 0.0400390625, 0.147369384765625, 0.25469970703125, 0.362030029296875, 0.4693603515625, 0.576690673828125, 0.68402099609375, 0.791351318359375, 0.898681640625, 1.006011962890625, 1.11334228515625, 1.220672607421875, 1.3280029296875, 1.435333251953125, 1.54266357421875, 1.649993896484375, 1.75732421875, 1.864654541015625, 1.97198486328125, 2.079315185546875, 2.1866455078125, 2.293975830078125, 2.40130615234375, 2.508636474609375, 2.615966796875, 2.723297119140625, 2.83062744140625, 2.937957763671875, 3.0452880859375, 3.152618408203125, 3.25994873046875, 3.367279052734375, 3.474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 8.0, 7.0, 8.0, 17.0, 26.0, 35.0, 52.0, 66.0, 79.0, 102.0, 110.0, 97.0, 98.0, 81.0, 58.0, 50.0, 26.0, 21.0, 11.0, 13.0, 6.0, 8.0, 3.0, 1.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57275390625, -0.5522308349609375, -0.531707763671875, -0.5111846923828125, -0.49066162109375, -0.4701385498046875, -0.449615478515625, -0.4290924072265625, -0.4085693359375, -0.3880462646484375, -0.367523193359375, -0.3470001220703125, -0.32647705078125, -0.3059539794921875, -0.285430908203125, -0.2649078369140625, -0.244384765625, -0.2238616943359375, -0.203338623046875, -0.1828155517578125, -0.16229248046875, -0.1417694091796875, -0.121246337890625, -0.1007232666015625, -0.0802001953125, -0.0596771240234375, -0.039154052734375, -0.0186309814453125, 0.00189208984375, 0.0224151611328125, 0.042938232421875, 0.0634613037109375, 0.083984375, 0.1045074462890625, 0.125030517578125, 0.1455535888671875, 0.16607666015625, 0.1865997314453125, 0.207122802734375, 0.2276458740234375, 0.2481689453125, 0.2686920166015625, 0.289215087890625, 0.3097381591796875, 0.33026123046875, 0.3507843017578125, 0.371307373046875, 0.3918304443359375, 0.412353515625, 0.4328765869140625, 0.453399658203125, 0.4739227294921875, 0.49444580078125, 0.5149688720703125, 0.535491943359375, 0.5560150146484375, 0.5765380859375, 0.5970611572265625, 0.617584228515625, 0.6381072998046875, 0.65863037109375, 0.6791534423828125, 0.699676513671875, 0.7201995849609375, 0.74072265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 17.0, 11.0, 25.0, 47.0, 47.0, 77.0, 107.0, 114.0, 123.0, 118.0, 89.0, 66.0, 57.0, 35.0, 18.0, 16.0, 11.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46297025680542, -6.257547855377197, -6.052124977111816, -5.846702575683594, -5.641280174255371, -5.435857772827148, -5.230434894561768, -5.025012493133545, -4.819589614868164, -4.614167213439941, -4.4087443351745605, -4.203321933746338, -3.9978995323181152, -3.7924768924713135, -3.5870542526245117, -3.381631851196289, -3.1762094497680664, -2.9707868099212646, -2.765364408493042, -2.5599417686462402, -2.3545193672180176, -2.149096727371216, -1.943674087524414, -1.7382515668869019, -1.5328290462493896, -1.3274065256118774, -1.1219840049743652, -0.9165613651275635, -0.7111388444900513, -0.5057163238525391, -0.3002936840057373, -0.0948711633682251, 0.11055135726928711, 0.3159739077091217, 0.5213964581489563, 0.7268190383911133, 0.9322415590286255, 1.1376640796661377, 1.3430867195129395, 1.5485092401504517, 1.7539317607879639, 1.959354281425476, 2.1647768020629883, 2.37019944190979, 2.575622081756592, 2.7810444831848145, 2.986467123031616, 3.191889762878418, 3.3973121643066406, 3.6027348041534424, 3.808157205581665, 4.013579845428467, 4.2190022468566895, 4.42442512512207, 4.629847526550293, 4.835269927978516, 5.040692329406738, 5.246114730834961, 5.451537609100342, 5.6569600105285645, 5.862382411956787, 6.067805290222168, 6.273227691650391, 6.478650093078613, 6.684072971343994]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 12.0, 11.0, 18.0, 26.0, 26.0, 38.0, 40.0, 34.0, 61.0, 65.0, 66.0, 66.0, 61.0, 67.0, 76.0, 62.0, 60.0, 44.0, 39.0, 34.0, 24.0, 21.0, 17.0, 11.0, 4.0, 7.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.972057342529297, -11.689726829528809, -11.40739631652832, -11.125065803527832, -10.842735290527344, -10.560403823852539, -10.278074264526367, -9.995742797851562, -9.713412284851074, -9.431081771850586, -9.148751258850098, -8.86642074584961, -8.584090232849121, -8.301759719848633, -8.019428253173828, -7.737098217010498, -7.45476770401001, -7.1724371910095215, -6.890106678009033, -6.607775688171387, -6.325445175170898, -6.04311466217041, -5.760784149169922, -5.478453636169434, -5.196123123168945, -4.913792610168457, -4.631462097167969, -4.3491315841674805, -4.066800594329834, -3.7844700813293457, -3.5021395683288574, -3.219809055328369, -2.9374780654907227, -2.6551475524902344, -2.372816801071167, -2.0904862880706787, -1.8081556558609009, -1.525825023651123, -1.2434945106506348, -0.9611638784408569, -0.6788332462310791, -0.39650264382362366, -0.11417204141616821, 0.16815853118896484, 0.4504891633987427, 0.7328197956085205, 1.0151503086090088, 1.2974809408187866, 1.5798115730285645, 1.8621422052383423, 2.14447283744812, 2.4268033504486084, 2.709134101867676, 2.991464614868164, 3.2737951278686523, 3.5561256408691406, 3.838456392288208, 4.120787143707275, 4.403117656707764, 4.685448169708252, 4.96777868270874, 5.250109672546387, 5.532440185546875, 5.814770698547363, 6.097101211547852]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 6.0, 3.0, 15.0, 16.0, 28.0, 35.0, 50.0, 68.0, 106.0, 149.0, 253.0, 447.0, 946.0, 4906.0, 97344.0, 2601769.0, 1441915.0, 42289.0, 2613.0, 571.0, 277.0, 156.0, 100.0, 72.0, 48.0, 34.0, 15.0, 9.0, 11.0, 11.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.73284912109375, -4.5164794921875, -4.30010986328125, -4.083740234375, -3.86737060546875, -3.6510009765625, -3.43463134765625, -3.21826171875, -3.00189208984375, -2.7855224609375, -2.56915283203125, -2.352783203125, -2.13641357421875, -1.9200439453125, -1.70367431640625, -1.4873046875, -1.27093505859375, -1.0545654296875, -0.83819580078125, -0.621826171875, -0.40545654296875, -0.1890869140625, 0.02728271484375, 0.24365234375, 0.46002197265625, 0.6763916015625, 0.89276123046875, 1.109130859375, 1.32550048828125, 1.5418701171875, 1.75823974609375, 1.974609375, 2.19097900390625, 2.4073486328125, 2.62371826171875, 2.840087890625, 3.05645751953125, 3.2728271484375, 3.48919677734375, 3.70556640625, 3.92193603515625, 4.1383056640625, 4.35467529296875, 4.571044921875, 4.78741455078125, 5.0037841796875, 5.22015380859375, 5.4365234375, 5.65289306640625, 5.8692626953125, 6.08563232421875, 6.302001953125, 6.51837158203125, 6.7347412109375, 6.95111083984375, 7.16748046875, 7.38385009765625, 7.6002197265625, 7.81658935546875, 8.032958984375, 8.24932861328125, 8.4656982421875, 8.68206787109375, 8.8984375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 12.0, 14.0, 16.0, 26.0, 26.0, 23.0, 38.0, 44.0, 42.0, 38.0, 55.0, 51.0, 64.0, 50.0, 66.0, 48.0, 46.0, 46.0, 44.0, 30.0, 46.0, 27.0, 21.0, 18.0, 17.0, 12.0, 18.0, 9.0, 10.0, 5.0, 4.0, 1.0, 7.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.49700927734375, -2.4061279296875, -2.31524658203125, -2.224365234375, -2.13348388671875, -2.0426025390625, -1.95172119140625, -1.86083984375, -1.76995849609375, -1.6790771484375, -1.58819580078125, -1.497314453125, -1.40643310546875, -1.3155517578125, -1.22467041015625, -1.1337890625, -1.04290771484375, -0.9520263671875, -0.86114501953125, -0.770263671875, -0.67938232421875, -0.5885009765625, -0.49761962890625, -0.40673828125, -0.31585693359375, -0.2249755859375, -0.13409423828125, -0.043212890625, 0.04766845703125, 0.1385498046875, 0.22943115234375, 0.3203125, 0.41119384765625, 0.5020751953125, 0.59295654296875, 0.683837890625, 0.77471923828125, 0.8656005859375, 0.95648193359375, 1.04736328125, 1.13824462890625, 1.2291259765625, 1.32000732421875, 1.410888671875, 1.50177001953125, 1.5926513671875, 1.68353271484375, 1.7744140625, 1.86529541015625, 1.9561767578125, 2.04705810546875, 2.137939453125, 2.22882080078125, 2.3197021484375, 2.41058349609375, 2.50146484375, 2.59234619140625, 2.6832275390625, 2.77410888671875, 2.864990234375, 2.95587158203125, 3.0467529296875, 3.13763427734375, 3.228515625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 10.0, 31.0, 81.0, 240.0, 691.0, 3497.0, 225773.0, 3938379.0, 23183.0, 1672.0, 436.0, 181.0, 62.0, 23.0, 12.0, 3.0, 3.0, 4.0], "bins": [-18.015625, -17.677642822265625, -17.33966064453125, -17.001678466796875, -16.6636962890625, -16.325714111328125, -15.98773193359375, -15.649749755859375, -15.311767578125, -14.973785400390625, -14.63580322265625, -14.297821044921875, -13.9598388671875, -13.621856689453125, -13.28387451171875, -12.945892333984375, -12.60791015625, -12.269927978515625, -11.93194580078125, -11.593963623046875, -11.2559814453125, -10.917999267578125, -10.58001708984375, -10.242034912109375, -9.904052734375, -9.566070556640625, -9.22808837890625, -8.890106201171875, -8.5521240234375, -8.214141845703125, -7.87615966796875, -7.538177490234375, -7.2001953125, -6.862213134765625, -6.52423095703125, -6.186248779296875, -5.8482666015625, -5.510284423828125, -5.17230224609375, -4.834320068359375, -4.496337890625, -4.158355712890625, -3.82037353515625, -3.482391357421875, -3.1444091796875, -2.806427001953125, -2.46844482421875, -2.130462646484375, -1.79248046875, -1.454498291015625, -1.11651611328125, -0.778533935546875, -0.4405517578125, -0.102569580078125, 0.23541259765625, 0.573394775390625, 0.911376953125, 1.249359130859375, 1.58734130859375, 1.925323486328125, 2.2633056640625, 2.601287841796875, 2.93927001953125, 3.277252197265625, 3.615234375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 8.0, 14.0, 24.0, 31.0, 27.0, 38.0, 59.0, 82.0, 106.0, 149.0, 222.0, 278.0, 329.0, 444.0, 464.0, 437.0, 328.0, 267.0, 212.0, 157.0, 98.0, 76.0, 61.0, 41.0, 33.0, 30.0, 14.0, 5.0, 5.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.083984375, -1.0533676147460938, -1.0227508544921875, -0.9921340942382812, -0.961517333984375, -0.9309005737304688, -0.9002838134765625, -0.8696670532226562, -0.83905029296875, -0.8084335327148438, -0.7778167724609375, -0.7472000122070312, -0.716583251953125, -0.6859664916992188, -0.6553497314453125, -0.6247329711914062, -0.5941162109375, -0.5634994506835938, -0.5328826904296875, -0.5022659301757812, -0.471649169921875, -0.44103240966796875, -0.4104156494140625, -0.37979888916015625, -0.34918212890625, -0.31856536865234375, -0.2879486083984375, -0.25733184814453125, -0.226715087890625, -0.19609832763671875, -0.1654815673828125, -0.13486480712890625, -0.104248046875, -0.07363128662109375, -0.0430145263671875, -0.01239776611328125, 0.018218994140625, 0.04883575439453125, 0.0794525146484375, 0.11006927490234375, 0.14068603515625, 0.17130279541015625, 0.2019195556640625, 0.23253631591796875, 0.263153076171875, 0.29376983642578125, 0.3243865966796875, 0.35500335693359375, 0.3856201171875, 0.41623687744140625, 0.4468536376953125, 0.47747039794921875, 0.508087158203125, 0.5387039184570312, 0.5693206787109375, 0.5999374389648438, 0.63055419921875, 0.6611709594726562, 0.6917877197265625, 0.7224044799804688, 0.753021240234375, 0.7836380004882812, 0.8142547607421875, 0.8448715209960938, 0.87548828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 15.0, 13.0, 27.0, 47.0, 72.0, 101.0, 117.0, 126.0, 130.0, 100.0, 83.0, 72.0, 27.0, 31.0, 19.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.511949062347412, -5.320488929748535, -5.129029273986816, -4.9375691413879395, -4.746109485626221, -4.554649353027344, -4.363189697265625, -4.171729564666748, -3.98026967048645, -3.7888097763061523, -3.5973498821258545, -3.4058899879455566, -3.2144298553466797, -3.022970199584961, -2.831510066986084, -2.640050172805786, -2.4485902786254883, -2.2571303844451904, -2.0656704902648926, -1.8742104768753052, -1.6827505826950073, -1.4912906885147095, -1.299830675125122, -1.1083707809448242, -0.9169108867645264, -0.7254509925842285, -0.5339910387992859, -0.34253108501434326, -0.1510711908340454, 0.04038870334625244, 0.23184871673583984, 0.4233086109161377, 0.6147680282592773, 0.8062279224395752, 0.9976878762245178, 1.1891478300094604, 1.3806077241897583, 1.5720676183700562, 1.7635276317596436, 1.9549875259399414, 2.1464474201202393, 2.337907314300537, 2.529367208480835, 2.720827102661133, 2.9122872352600098, 3.1037468910217285, 3.2952070236206055, 3.4866669178009033, 3.678126811981201, 3.869586706161499, 4.061046600341797, 4.252506732940674, 4.443966388702393, 4.6354265213012695, 4.826886177062988, 5.018346309661865, 5.209806442260742, 5.401266574859619, 5.592726230621338, 5.784186363220215, 5.975646018981934, 6.1671061515808105, 6.3585662841796875, 6.550025939941406, 6.741485595703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 7.0, 6.0, 12.0, 11.0, 16.0, 13.0, 25.0, 20.0, 24.0, 28.0, 39.0, 43.0, 42.0, 39.0, 54.0, 45.0, 41.0, 34.0, 53.0, 41.0, 42.0, 38.0, 44.0, 43.0, 35.0, 35.0, 26.0, 22.0, 18.0, 17.0, 16.0, 17.0, 13.0, 8.0, 5.0, 4.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8771300315856934, -2.7858071327209473, -2.6944844722747803, -2.603161573410034, -2.511838912963867, -2.420516014099121, -2.329193115234375, -2.237870454788208, -2.146547794342041, -2.055224895477295, -1.963902235031128, -1.8725793361663818, -1.7812566757202148, -1.6899337768554688, -1.5986109972000122, -1.5072882175445557, -1.4159653186798096, -1.324642539024353, -1.2333197593688965, -1.1419968605041504, -1.0506742000579834, -0.9593513607978821, -0.8680285215377808, -0.7767057418823242, -0.6853829622268677, -0.5940601825714111, -0.5027374029159546, -0.41141456365585327, -0.32009178400039673, -0.22876900434494019, -0.13744616508483887, -0.046123385429382324, 0.04519963264465332, 0.13652242720127106, 0.2278452217578888, 0.3191680312156677, 0.41049081087112427, 0.5018135905265808, 0.5931364297866821, 0.6844592094421387, 0.7757819890975952, 0.8671047687530518, 0.9584275484085083, 1.0497503280639648, 1.141073226928711, 1.232395887374878, 1.323718786239624, 1.4150415658950806, 1.506364345550537, 1.5976871252059937, 1.6890099048614502, 1.7803328037261963, 1.8716554641723633, 1.9629783630371094, 2.0543012619018555, 2.1456239223480225, 2.2369465827941895, 2.3282694816589355, 2.4195921421051025, 2.5109150409698486, 2.6022377014160156, 2.6935606002807617, 2.784883499145508, 2.876206159591675, 2.967529058456421]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 22.0, 23.0, 27.0, 44.0, 52.0, 71.0, 132.0, 226.0, 354.0, 572.0, 956.0, 1746.0, 3144.0, 6207.0, 12833.0, 28790.0, 66350.0, 153648.0, 275533.0, 258096.0, 134569.0, 57170.0, 24483.0, 11215.0, 5580.0, 2920.0, 1571.0, 869.0, 495.0, 313.0, 187.0, 112.0, 73.0, 46.0, 28.0, 25.0, 23.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.44287109375, -0.42899322509765625, -0.4151153564453125, -0.40123748779296875, -0.387359619140625, -0.37348175048828125, -0.3596038818359375, -0.34572601318359375, -0.33184814453125, -0.31797027587890625, -0.3040924072265625, -0.29021453857421875, -0.276336669921875, -0.26245880126953125, -0.2485809326171875, -0.23470306396484375, -0.2208251953125, -0.20694732666015625, -0.1930694580078125, -0.17919158935546875, -0.165313720703125, -0.15143585205078125, -0.1375579833984375, -0.12368011474609375, -0.10980224609375, -0.09592437744140625, -0.0820465087890625, -0.06816864013671875, -0.054290771484375, -0.04041290283203125, -0.0265350341796875, -0.01265716552734375, 0.001220703125, 0.01509857177734375, 0.0289764404296875, 0.04285430908203125, 0.056732177734375, 0.07061004638671875, 0.0844879150390625, 0.09836578369140625, 0.11224365234375, 0.12612152099609375, 0.1399993896484375, 0.15387725830078125, 0.167755126953125, 0.18163299560546875, 0.1955108642578125, 0.20938873291015625, 0.2232666015625, 0.23714447021484375, 0.2510223388671875, 0.26490020751953125, 0.278778076171875, 0.29265594482421875, 0.3065338134765625, 0.32041168212890625, 0.33428955078125, 0.34816741943359375, 0.3620452880859375, 0.37592315673828125, 0.389801025390625, 0.40367889404296875, 0.4175567626953125, 0.43143463134765625, 0.4453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 9.0, 12.0, 22.0, 21.0, 25.0, 30.0, 43.0, 34.0, 52.0, 62.0, 58.0, 55.0, 61.0, 43.0, 59.0, 70.0, 55.0, 39.0, 52.0, 38.0, 28.0, 24.0, 21.0, 10.0, 18.0, 10.0, 8.0, 11.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.467010498046875, -2.38519287109375, -2.303375244140625, -2.2215576171875, -2.139739990234375, -2.05792236328125, -1.976104736328125, -1.894287109375, -1.812469482421875, -1.73065185546875, -1.648834228515625, -1.5670166015625, -1.485198974609375, -1.40338134765625, -1.321563720703125, -1.23974609375, -1.157928466796875, -1.07611083984375, -0.994293212890625, -0.9124755859375, -0.830657958984375, -0.74884033203125, -0.667022705078125, -0.585205078125, -0.503387451171875, -0.42156982421875, -0.339752197265625, -0.2579345703125, -0.176116943359375, -0.09429931640625, -0.012481689453125, 0.0693359375, 0.151153564453125, 0.23297119140625, 0.314788818359375, 0.3966064453125, 0.478424072265625, 0.56024169921875, 0.642059326171875, 0.723876953125, 0.805694580078125, 0.88751220703125, 0.969329833984375, 1.0511474609375, 1.132965087890625, 1.21478271484375, 1.296600341796875, 1.37841796875, 1.460235595703125, 1.54205322265625, 1.623870849609375, 1.7056884765625, 1.787506103515625, 1.86932373046875, 1.951141357421875, 2.032958984375, 2.114776611328125, 2.19659423828125, 2.278411865234375, 2.3602294921875, 2.442047119140625, 2.52386474609375, 2.605682373046875, 2.6875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 9.0, 5.0, 11.0, 21.0, 21.0, 39.0, 61.0, 77.0, 147.0, 204.0, 332.0, 484.0, 741.0, 1201.0, 1873.0, 3055.0, 5017.0, 8202.0, 13491.0, 23394.0, 40524.0, 67484.0, 110160.0, 160717.0, 186401.0, 158030.0, 106512.0, 65031.0, 38272.0, 22630.0, 13485.0, 8028.0, 4730.0, 2931.0, 1900.0, 1168.0, 729.0, 517.0, 295.0, 206.0, 132.0, 79.0, 61.0, 48.0, 28.0, 18.0, 14.0, 8.0, 8.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.2294921875, -0.22195816040039062, -0.21442413330078125, -0.20689010620117188, -0.1993560791015625, -0.19182205200195312, -0.18428802490234375, -0.17675399780273438, -0.169219970703125, -0.16168594360351562, -0.15415191650390625, -0.14661788940429688, -0.1390838623046875, -0.13154983520507812, -0.12401580810546875, -0.11648178100585938, -0.10894775390625, -0.10141372680664062, -0.09387969970703125, -0.08634567260742188, -0.0788116455078125, -0.07127761840820312, -0.06374359130859375, -0.056209564208984375, -0.048675537109375, -0.041141510009765625, -0.03360748291015625, -0.026073455810546875, -0.0185394287109375, -0.011005401611328125, -0.00347137451171875, 0.004062652587890625, 0.0115966796875, 0.019130706787109375, 0.02666473388671875, 0.034198760986328125, 0.0417327880859375, 0.049266815185546875, 0.05680084228515625, 0.06433486938476562, 0.071868896484375, 0.07940292358398438, 0.08693695068359375, 0.09447097778320312, 0.1020050048828125, 0.10953903198242188, 0.11707305908203125, 0.12460708618164062, 0.13214111328125, 0.13967514038085938, 0.14720916748046875, 0.15474319458007812, 0.1622772216796875, 0.16981124877929688, 0.17734527587890625, 0.18487930297851562, 0.192413330078125, 0.19994735717773438, 0.20748138427734375, 0.21501541137695312, 0.2225494384765625, 0.23008346557617188, 0.23761749267578125, 0.24515151977539062, 0.252685546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 4.0, 9.0, 13.0, 15.0, 16.0, 19.0, 19.0, 34.0, 38.0, 40.0, 45.0, 49.0, 34.0, 55.0, 66.0, 53.0, 73.0, 61.0, 48.0, 46.0, 41.0, 25.0, 38.0, 36.0, 22.0, 17.0, 6.0, 14.0, 12.0, 5.0, 15.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.22637939453125, -4.0816650390625, -3.93695068359375, -3.792236328125, -3.64752197265625, -3.5028076171875, -3.35809326171875, -3.21337890625, -3.06866455078125, -2.9239501953125, -2.77923583984375, -2.634521484375, -2.48980712890625, -2.3450927734375, -2.20037841796875, -2.0556640625, -1.91094970703125, -1.7662353515625, -1.62152099609375, -1.476806640625, -1.33209228515625, -1.1873779296875, -1.04266357421875, -0.89794921875, -0.75323486328125, -0.6085205078125, -0.46380615234375, -0.319091796875, -0.17437744140625, -0.0296630859375, 0.11505126953125, 0.259765625, 0.40447998046875, 0.5491943359375, 0.69390869140625, 0.838623046875, 0.98333740234375, 1.1280517578125, 1.27276611328125, 1.41748046875, 1.56219482421875, 1.7069091796875, 1.85162353515625, 1.996337890625, 2.14105224609375, 2.2857666015625, 2.43048095703125, 2.5751953125, 2.71990966796875, 2.8646240234375, 3.00933837890625, 3.154052734375, 3.29876708984375, 3.4434814453125, 3.58819580078125, 3.73291015625, 3.87762451171875, 4.0223388671875, 4.16705322265625, 4.311767578125, 4.45648193359375, 4.6011962890625, 4.74591064453125, 4.890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 5.0, 8.0, 9.0, 22.0, 24.0, 36.0, 40.0, 75.0, 97.0, 104.0, 168.0, 261.0, 376.0, 588.0, 1026.0, 1775.0, 3116.0, 6365.0, 13612.0, 30505.0, 69323.0, 156522.0, 305313.0, 251205.0, 114324.0, 50166.0, 22395.0, 10122.0, 4784.0, 2453.0, 1359.0, 797.0, 513.0, 325.0, 209.0, 139.0, 116.0, 80.0, 59.0, 40.0, 19.0, 22.0, 18.0, 13.0, 4.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.050537109375, -0.049085140228271484, -0.04763317108154297, -0.04618120193481445, -0.04472923278808594, -0.04327726364135742, -0.041825294494628906, -0.04037332534790039, -0.038921356201171875, -0.03746938705444336, -0.036017417907714844, -0.03456544876098633, -0.03311347961425781, -0.0316615104675293, -0.03020954132080078, -0.028757572174072266, -0.02730560302734375, -0.025853633880615234, -0.02440166473388672, -0.022949695587158203, -0.021497726440429688, -0.020045757293701172, -0.018593788146972656, -0.01714181900024414, -0.015689849853515625, -0.01423788070678711, -0.012785911560058594, -0.011333942413330078, -0.009881973266601562, -0.008430004119873047, -0.006978034973144531, -0.005526065826416016, -0.0040740966796875, -0.0026221275329589844, -0.0011701583862304688, 0.0002818107604980469, 0.0017337799072265625, 0.003185749053955078, 0.004637718200683594, 0.006089687347412109, 0.007541656494140625, 0.00899362564086914, 0.010445594787597656, 0.011897563934326172, 0.013349533081054688, 0.014801502227783203, 0.01625347137451172, 0.017705440521240234, 0.01915740966796875, 0.020609378814697266, 0.02206134796142578, 0.023513317108154297, 0.024965286254882812, 0.026417255401611328, 0.027869224548339844, 0.02932119369506836, 0.030773162841796875, 0.03222513198852539, 0.033677101135253906, 0.03512907028198242, 0.03658103942871094, 0.03803300857543945, 0.03948497772216797, 0.040936946868896484, 0.042388916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 14.0, 27.0, 28.0, 54.0, 61.0, 77.0, 118.0, 160.0, 105.0, 91.0, 83.0, 55.0, 36.0, 23.0, 24.0, 8.0, 10.0, 9.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.413459777832031e-05, -6.196461617946625e-05, -5.979463458061218e-05, -5.762465298175812e-05, -5.545467138290405e-05, -5.328468978404999e-05, -5.111470818519592e-05, -4.894472658634186e-05, -4.677474498748779e-05, -4.460476338863373e-05, -4.243478178977966e-05, -4.02648001909256e-05, -3.809481859207153e-05, -3.592483699321747e-05, -3.37548553943634e-05, -3.158487379550934e-05, -2.9414892196655273e-05, -2.724491059780121e-05, -2.5074928998947144e-05, -2.290494740009308e-05, -2.0734965801239014e-05, -1.856498420238495e-05, -1.6395002603530884e-05, -1.4225021004676819e-05, -1.2055039405822754e-05, -9.885057806968689e-06, -7.715076208114624e-06, -5.545094609260559e-06, -3.375113010406494e-06, -1.2051314115524292e-06, 9.648501873016357e-07, 3.1348317861557007e-06, 5.304813385009766e-06, 7.4747949838638306e-06, 9.644776582717896e-06, 1.181475818157196e-05, 1.3984739780426025e-05, 1.615472137928009e-05, 1.8324702978134155e-05, 2.049468457698822e-05, 2.2664666175842285e-05, 2.483464777469635e-05, 2.7004629373550415e-05, 2.917461097240448e-05, 3.1344592571258545e-05, 3.351457417011261e-05, 3.5684555768966675e-05, 3.785453736782074e-05, 4.0024518966674805e-05, 4.219450056552887e-05, 4.4364482164382935e-05, 4.6534463763237e-05, 4.8704445362091064e-05, 5.087442696094513e-05, 5.3044408559799194e-05, 5.521439015865326e-05, 5.7384371757507324e-05, 5.955435335636139e-05, 6.172433495521545e-05, 6.389431655406952e-05, 6.606429815292358e-05, 6.823427975177765e-05, 7.040426135063171e-05, 7.257424294948578e-05, 7.474422454833984e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 9.0, 8.0, 17.0, 11.0, 22.0, 34.0, 35.0, 66.0, 76.0, 100.0, 146.0, 275.0, 518.0, 1115.0, 2315.0, 5406.0, 13584.0, 34173.0, 87625.0, 229940.0, 368730.0, 185153.0, 71345.0, 27986.0, 11228.0, 4555.0, 1939.0, 928.0, 422.0, 264.0, 154.0, 98.0, 70.0, 53.0, 40.0, 34.0, 24.0, 15.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04681396484375, -0.04522085189819336, -0.04362773895263672, -0.04203462600708008, -0.04044151306152344, -0.0388484001159668, -0.037255287170410156, -0.035662174224853516, -0.034069061279296875, -0.032475948333740234, -0.030882835388183594, -0.029289722442626953, -0.027696609497070312, -0.026103496551513672, -0.02451038360595703, -0.02291727066040039, -0.02132415771484375, -0.01973104476928711, -0.01813793182373047, -0.016544818878173828, -0.014951705932617188, -0.013358592987060547, -0.011765480041503906, -0.010172367095947266, -0.008579254150390625, -0.006986141204833984, -0.005393028259277344, -0.003799915313720703, -0.0022068023681640625, -0.0006136894226074219, 0.0009794235229492188, 0.0025725364685058594, 0.0041656494140625, 0.005758762359619141, 0.007351875305175781, 0.008944988250732422, 0.010538101196289062, 0.012131214141845703, 0.013724327087402344, 0.015317440032958984, 0.016910552978515625, 0.018503665924072266, 0.020096778869628906, 0.021689891815185547, 0.023283004760742188, 0.024876117706298828, 0.02646923065185547, 0.02806234359741211, 0.02965545654296875, 0.03124856948852539, 0.03284168243408203, 0.03443479537963867, 0.03602790832519531, 0.03762102127075195, 0.039214134216308594, 0.040807247161865234, 0.042400360107421875, 0.043993473052978516, 0.045586585998535156, 0.0471796989440918, 0.04877281188964844, 0.05036592483520508, 0.05195903778076172, 0.05355215072631836, 0.055145263671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 13.0, 14.0, 23.0, 23.0, 28.0, 38.0, 43.0, 64.0, 63.0, 78.0, 88.0, 58.0, 70.0, 57.0, 59.0, 38.0, 36.0, 34.0, 18.0, 27.0, 20.0, 16.0, 14.0, 6.0, 8.0, 8.0, 6.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519012451171875, -0.014665961265563965, -0.01414179801940918, -0.013617634773254395, -0.01309347152709961, -0.012569308280944824, -0.012045145034790039, -0.011520981788635254, -0.010996818542480469, -0.010472655296325684, -0.009948492050170898, -0.009424328804016113, -0.008900165557861328, -0.008376002311706543, -0.007851839065551758, -0.007327675819396973, -0.0068035125732421875, -0.006279349327087402, -0.005755186080932617, -0.005231022834777832, -0.004706859588623047, -0.004182696342468262, -0.0036585330963134766, -0.0031343698501586914, -0.0026102066040039062, -0.002086043357849121, -0.001561880111694336, -0.0010377168655395508, -0.0005135536193847656, 1.0609626770019531e-05, 0.0005347728729248047, 0.0010589361190795898, 0.001583099365234375, 0.00210726261138916, 0.0026314258575439453, 0.0031555891036987305, 0.0036797523498535156, 0.004203915596008301, 0.004728078842163086, 0.005252242088317871, 0.005776405334472656, 0.006300568580627441, 0.0068247318267822266, 0.007348895072937012, 0.007873058319091797, 0.008397221565246582, 0.008921384811401367, 0.009445548057556152, 0.009969711303710938, 0.010493874549865723, 0.011018037796020508, 0.011542201042175293, 0.012066364288330078, 0.012590527534484863, 0.013114690780639648, 0.013638854026794434, 0.014163017272949219, 0.014687180519104004, 0.015211343765258789, 0.015735507011413574, 0.01625967025756836, 0.016783833503723145, 0.01730799674987793, 0.017832159996032715, 0.0183563232421875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 44.0, 294.0, 519.0, 136.0, 16.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.308990478515625, -12.782543182373047, -12.256094932556152, -11.729646682739258, -11.20319938659668, -10.676752090454102, -10.150303840637207, -9.623855590820312, -9.097408294677734, -8.570960998535156, -8.044512748718262, -7.518064975738525, -6.991617202758789, -6.465169429779053, -5.938721656799316, -5.41227388381958, -4.885826110839844, -4.359378337860107, -3.832930564880371, -3.3064827919006348, -2.7800350189208984, -2.253587245941162, -1.7271394729614258, -1.2006916999816895, -0.6742439270019531, -0.1477961540222168, 0.37865161895751953, 0.9050993919372559, 1.4315471649169922, 1.9579949378967285, 2.484442710876465, 3.010890483856201, 3.5373382568359375, 4.063786029815674, 4.59023380279541, 5.1166815757751465, 5.643129348754883, 6.169577121734619, 6.6960248947143555, 7.222472667694092, 7.748920440673828, 8.275367736816406, 8.8018159866333, 9.328264236450195, 9.854711532592773, 10.381158828735352, 10.907607078552246, 11.43405532836914, 11.960502624511719, 12.486949920654297, 13.013398170471191, 13.539846420288086, 14.066293716430664, 14.592741012573242, 15.119189262390137, 15.645637512207031, 16.17208480834961, 16.698532104492188, 17.224979400634766, 17.751428604125977, 18.277875900268555, 18.804323196411133, 19.330772399902344, 19.857219696044922, 20.3836669921875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 8.0, 2.0, 16.0, 7.0, 19.0, 23.0, 25.0, 32.0, 31.0, 49.0, 55.0, 54.0, 54.0, 56.0, 50.0, 55.0, 54.0, 57.0, 49.0, 49.0, 46.0, 43.0, 28.0, 22.0, 23.0, 20.0, 21.0, 14.0, 4.0, 10.0, 5.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2922892570495605, -2.2165064811706543, -2.140723705291748, -2.0649406909942627, -1.9891579151153564, -1.9133751392364502, -1.837592363357544, -1.7618095874786377, -1.686026692390442, -1.6102439165115356, -1.5344610214233398, -1.4586782455444336, -1.3828954696655273, -1.3071125745773315, -1.2313297986984253, -1.1555469036102295, -1.0797641277313232, -1.003981351852417, -0.9281984567642212, -0.8524156808853149, -0.7766328454017639, -0.7008500099182129, -0.6250672340393066, -0.5492843985557556, -0.4735015630722046, -0.39771872758865356, -0.3219359219074249, -0.2461531013250351, -0.17037028074264526, -0.09458744525909424, -0.0188046395778656, 0.05697816610336304, 0.13276100158691406, 0.2085438221693039, 0.2843266427516937, 0.36010944843292236, 0.4358922839164734, 0.5116751194000244, 0.5874578952789307, 0.6632407307624817, 0.7390235662460327, 0.8148064017295837, 0.8905892372131348, 0.966372013092041, 1.0421547889709473, 1.117937684059143, 1.1937204599380493, 1.2695033550262451, 1.3452861309051514, 1.4210689067840576, 1.4968518018722534, 1.5726345777511597, 1.6484174728393555, 1.7242002487182617, 1.799983024597168, 1.8757658004760742, 1.95154869556427, 2.027331590652466, 2.103114366531372, 2.1788971424102783, 2.2546799182891846, 2.33046293258667, 2.406245708465576, 2.4820284843444824, 2.5578112602233887]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 5.0, 18.0, 15.0, 21.0, 27.0, 41.0, 65.0, 131.0, 358.0, 1462.0, 11502.0, 188477.0, 725308.0, 112298.0, 7107.0, 1142.0, 267.0, 123.0, 51.0, 47.0, 16.0, 10.0, 13.0, 13.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.08154296875, -3.9326171875, -3.78369140625, -3.634765625, -3.48583984375, -3.3369140625, -3.18798828125, -3.0390625, -2.89013671875, -2.7412109375, -2.59228515625, -2.443359375, -2.29443359375, -2.1455078125, -1.99658203125, -1.84765625, -1.69873046875, -1.5498046875, -1.40087890625, -1.251953125, -1.10302734375, -0.9541015625, -0.80517578125, -0.65625, -0.50732421875, -0.3583984375, -0.20947265625, -0.060546875, 0.08837890625, 0.2373046875, 0.38623046875, 0.53515625, 0.68408203125, 0.8330078125, 0.98193359375, 1.130859375, 1.27978515625, 1.4287109375, 1.57763671875, 1.7265625, 1.87548828125, 2.0244140625, 2.17333984375, 2.322265625, 2.47119140625, 2.6201171875, 2.76904296875, 2.91796875, 3.06689453125, 3.2158203125, 3.36474609375, 3.513671875, 3.66259765625, 3.8115234375, 3.96044921875, 4.109375, 4.25830078125, 4.4072265625, 4.55615234375, 4.705078125, 4.85400390625, 5.0029296875, 5.15185546875, 5.30078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 8.0, 10.0, 9.0, 19.0, 19.0, 29.0, 29.0, 40.0, 31.0, 49.0, 55.0, 59.0, 56.0, 67.0, 55.0, 56.0, 49.0, 53.0, 44.0, 54.0, 29.0, 29.0, 25.0, 20.0, 24.0, 12.0, 20.0, 11.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.667724609375, -4.52294921875, -4.378173828125, -4.2333984375, -4.088623046875, -3.94384765625, -3.799072265625, -3.654296875, -3.509521484375, -3.36474609375, -3.219970703125, -3.0751953125, -2.930419921875, -2.78564453125, -2.640869140625, -2.49609375, -2.351318359375, -2.20654296875, -2.061767578125, -1.9169921875, -1.772216796875, -1.62744140625, -1.482666015625, -1.337890625, -1.193115234375, -1.04833984375, -0.903564453125, -0.7587890625, -0.614013671875, -0.46923828125, -0.324462890625, -0.1796875, -0.034912109375, 0.10986328125, 0.254638671875, 0.3994140625, 0.544189453125, 0.68896484375, 0.833740234375, 0.978515625, 1.123291015625, 1.26806640625, 1.412841796875, 1.5576171875, 1.702392578125, 1.84716796875, 1.991943359375, 2.13671875, 2.281494140625, 2.42626953125, 2.571044921875, 2.7158203125, 2.860595703125, 3.00537109375, 3.150146484375, 3.294921875, 3.439697265625, 3.58447265625, 3.729248046875, 3.8740234375, 4.018798828125, 4.16357421875, 4.308349609375, 4.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 9.0, 12.0, 12.0, 18.0, 23.0, 42.0, 56.0, 73.0, 114.0, 138.0, 202.0, 392.0, 1211.0, 10758.0, 410146.0, 605501.0, 16993.0, 1562.0, 451.0, 238.0, 154.0, 125.0, 82.0, 65.0, 52.0, 29.0, 23.0, 18.0, 12.0, 5.0, 3.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.13671875, -5.951171875, -5.765625, -5.580078125, -5.39453125, -5.208984375, -5.0234375, -4.837890625, -4.65234375, -4.466796875, -4.28125, -4.095703125, -3.91015625, -3.724609375, -3.5390625, -3.353515625, -3.16796875, -2.982421875, -2.796875, -2.611328125, -2.42578125, -2.240234375, -2.0546875, -1.869140625, -1.68359375, -1.498046875, -1.3125, -1.126953125, -0.94140625, -0.755859375, -0.5703125, -0.384765625, -0.19921875, -0.013671875, 0.171875, 0.357421875, 0.54296875, 0.728515625, 0.9140625, 1.099609375, 1.28515625, 1.470703125, 1.65625, 1.841796875, 2.02734375, 2.212890625, 2.3984375, 2.583984375, 2.76953125, 2.955078125, 3.140625, 3.326171875, 3.51171875, 3.697265625, 3.8828125, 4.068359375, 4.25390625, 4.439453125, 4.625, 4.810546875, 4.99609375, 5.181640625, 5.3671875, 5.552734375, 5.73828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 3.0, 14.0, 5.0, 16.0, 12.0, 28.0, 21.0, 21.0, 39.0, 40.0, 44.0, 47.0, 43.0, 48.0, 51.0, 43.0, 43.0, 60.0, 44.0, 41.0, 39.0, 37.0, 37.0, 35.0, 41.0, 20.0, 30.0, 22.0, 14.0, 14.0, 11.0, 8.0, 5.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.30859375, -5.15606689453125, -5.0035400390625, -4.85101318359375, -4.698486328125, -4.54595947265625, -4.3934326171875, -4.24090576171875, -4.08837890625, -3.93585205078125, -3.7833251953125, -3.63079833984375, -3.478271484375, -3.32574462890625, -3.1732177734375, -3.02069091796875, -2.8681640625, -2.71563720703125, -2.5631103515625, -2.41058349609375, -2.258056640625, -2.10552978515625, -1.9530029296875, -1.80047607421875, -1.64794921875, -1.49542236328125, -1.3428955078125, -1.19036865234375, -1.037841796875, -0.88531494140625, -0.7327880859375, -0.58026123046875, -0.427734375, -0.27520751953125, -0.1226806640625, 0.02984619140625, 0.182373046875, 0.33489990234375, 0.4874267578125, 0.63995361328125, 0.79248046875, 0.94500732421875, 1.0975341796875, 1.25006103515625, 1.402587890625, 1.55511474609375, 1.7076416015625, 1.86016845703125, 2.0126953125, 2.16522216796875, 2.3177490234375, 2.47027587890625, 2.622802734375, 2.77532958984375, 2.9278564453125, 3.08038330078125, 3.23291015625, 3.38543701171875, 3.5379638671875, 3.69049072265625, 3.843017578125, 3.99554443359375, 4.1480712890625, 4.30059814453125, 4.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 10.0, 12.0, 19.0, 47.0, 81.0, 225.0, 935.0, 8003.0, 665544.0, 366529.0, 5966.0, 790.0, 200.0, 77.0, 42.0, 29.0, 12.0, 10.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.5643310546875, -3.441162109375, -3.3179931640625, -3.19482421875, -3.0716552734375, -2.948486328125, -2.8253173828125, -2.7021484375, -2.5789794921875, -2.455810546875, -2.3326416015625, -2.20947265625, -2.0863037109375, -1.963134765625, -1.8399658203125, -1.716796875, -1.5936279296875, -1.470458984375, -1.3472900390625, -1.22412109375, -1.1009521484375, -0.977783203125, -0.8546142578125, -0.7314453125, -0.6082763671875, -0.485107421875, -0.3619384765625, -0.23876953125, -0.1156005859375, 0.007568359375, 0.1307373046875, 0.25390625, 0.3770751953125, 0.500244140625, 0.6234130859375, 0.74658203125, 0.8697509765625, 0.992919921875, 1.1160888671875, 1.2392578125, 1.3624267578125, 1.485595703125, 1.6087646484375, 1.73193359375, 1.8551025390625, 1.978271484375, 2.1014404296875, 2.224609375, 2.3477783203125, 2.470947265625, 2.5941162109375, 2.71728515625, 2.8404541015625, 2.963623046875, 3.0867919921875, 3.2099609375, 3.3331298828125, 3.456298828125, 3.5794677734375, 3.70263671875, 3.8258056640625, 3.948974609375, 4.0721435546875, 4.1953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 2.0, 6.0, 8.0, 11.0, 6.0, 13.0, 19.0, 32.0, 28.0, 43.0, 49.0, 57.0, 78.0, 120.0, 96.0, 86.0, 66.0, 58.0, 43.0, 36.0, 31.0, 29.0, 18.0, 16.0, 8.0, 4.0, 8.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018155574798583984, -0.00017639808356761932, -0.0001712404191493988, -0.00016608275473117828, -0.00016092509031295776, -0.00015576742589473724, -0.00015060976147651672, -0.0001454520970582962, -0.00014029443264007568, -0.00013513676822185516, -0.00012997910380363464, -0.00012482143938541412, -0.0001196637749671936, -0.00011450611054897308, -0.00010934844613075256, -0.00010419078171253204, -9.903311729431152e-05, -9.3875452876091e-05, -8.871778845787048e-05, -8.356012403964996e-05, -7.840245962142944e-05, -7.324479520320892e-05, -6.80871307849884e-05, -6.292946636676788e-05, -5.777180194854736e-05, -5.261413753032684e-05, -4.745647311210632e-05, -4.22988086938858e-05, -3.714114427566528e-05, -3.198347985744476e-05, -2.6825815439224243e-05, -2.1668151021003723e-05, -1.6510486602783203e-05, -1.1352822184562683e-05, -6.195157766342163e-06, -1.037493348121643e-06, 4.120171070098877e-06, 9.277835488319397e-06, 1.4435499906539917e-05, 1.9593164324760437e-05, 2.4750828742980957e-05, 2.9908493161201477e-05, 3.5066157579422e-05, 4.022382199764252e-05, 4.538148641586304e-05, 5.053915083408356e-05, 5.569681525230408e-05, 6.08544796705246e-05, 6.601214408874512e-05, 7.116980850696564e-05, 7.632747292518616e-05, 8.148513734340668e-05, 8.66428017616272e-05, 9.180046617984772e-05, 9.695813059806824e-05, 0.00010211579501628876, 0.00010727345943450928, 0.0001124311238527298, 0.00011758878827095032, 0.00012274645268917084, 0.00012790411710739136, 0.00013306178152561188, 0.0001382194459438324, 0.00014337711036205292, 0.00014853477478027344]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 13.0, 17.0, 18.0, 29.0, 45.0, 74.0, 160.0, 408.0, 2001.0, 31727.0, 968659.0, 42193.0, 2377.0, 460.0, 174.0, 78.0, 38.0, 33.0, 18.0, 10.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.95458984375, -2.8388671875, -2.72314453125, -2.607421875, -2.49169921875, -2.3759765625, -2.26025390625, -2.14453125, -2.02880859375, -1.9130859375, -1.79736328125, -1.681640625, -1.56591796875, -1.4501953125, -1.33447265625, -1.21875, -1.10302734375, -0.9873046875, -0.87158203125, -0.755859375, -0.64013671875, -0.5244140625, -0.40869140625, -0.29296875, -0.17724609375, -0.0615234375, 0.05419921875, 0.169921875, 0.28564453125, 0.4013671875, 0.51708984375, 0.6328125, 0.74853515625, 0.8642578125, 0.97998046875, 1.095703125, 1.21142578125, 1.3271484375, 1.44287109375, 1.55859375, 1.67431640625, 1.7900390625, 1.90576171875, 2.021484375, 2.13720703125, 2.2529296875, 2.36865234375, 2.484375, 2.60009765625, 2.7158203125, 2.83154296875, 2.947265625, 3.06298828125, 3.1787109375, 3.29443359375, 3.41015625, 3.52587890625, 3.6416015625, 3.75732421875, 3.873046875, 3.98876953125, 4.1044921875, 4.22021484375, 4.3359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 13.0, 14.0, 18.0, 37.0, 46.0, 68.0, 98.0, 100.0, 120.0, 113.0, 90.0, 89.0, 51.0, 41.0, 30.0, 14.0, 6.0, 12.0, 11.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7724609375, -0.7520523071289062, -0.7316436767578125, -0.7112350463867188, -0.690826416015625, -0.6704177856445312, -0.6500091552734375, -0.6296005249023438, -0.60919189453125, -0.5887832641601562, -0.5683746337890625, -0.5479660034179688, -0.527557373046875, -0.5071487426757812, -0.4867401123046875, -0.46633148193359375, -0.4459228515625, -0.42551422119140625, -0.4051055908203125, -0.38469696044921875, -0.364288330078125, -0.34387969970703125, -0.3234710693359375, -0.30306243896484375, -0.28265380859375, -0.26224517822265625, -0.2418365478515625, -0.22142791748046875, -0.201019287109375, -0.18061065673828125, -0.1602020263671875, -0.13979339599609375, -0.119384765625, -0.09897613525390625, -0.0785675048828125, -0.05815887451171875, -0.037750244140625, -0.01734161376953125, 0.0030670166015625, 0.02347564697265625, 0.04388427734375, 0.06429290771484375, 0.0847015380859375, 0.10511016845703125, 0.125518798828125, 0.14592742919921875, 0.1663360595703125, 0.18674468994140625, 0.2071533203125, 0.22756195068359375, 0.2479705810546875, 0.26837921142578125, 0.288787841796875, 0.30919647216796875, 0.3296051025390625, 0.35001373291015625, 0.37042236328125, 0.39083099365234375, 0.4112396240234375, 0.43164825439453125, 0.452056884765625, 0.47246551513671875, 0.4928741455078125, 0.5132827758789062, 0.53369140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 15.0, 23.0, 48.0, 65.0, 108.0, 154.0, 190.0, 151.0, 106.0, 66.0, 33.0, 20.0, 10.0, 8.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.412341117858887, -5.099510669708252, -4.786680221557617, -4.473849773406982, -4.161019325256348, -3.848189115524292, -3.5353589057922363, -3.2225284576416016, -2.909698009490967, -2.596867561340332, -2.2840371131896973, -1.9712069034576416, -1.6583764553070068, -1.345546007156372, -1.0327156782150269, -0.7198853492736816, -0.4070549011230469, -0.09422451257705688, 0.2186058759689331, 0.5314362645149231, 0.8442666530609131, 1.1570971012115479, 1.469927430152893, 1.7827577590942383, 2.095588207244873, 2.408418655395508, 2.7212491035461426, 3.0340793132781982, 3.346909761428833, 3.6597402095794678, 3.9725704193115234, 4.285400867462158, 4.598230361938477, 4.911060810089111, 5.223891258239746, 5.536721706390381, 5.849552154541016, 6.162382125854492, 6.475212574005127, 6.788043022155762, 7.1008734703063965, 7.413703918457031, 7.726534366607666, 8.0393648147583, 8.352194786071777, 8.66502571105957, 8.977855682373047, 9.290685653686523, 9.603516578674316, 9.916346549987793, 10.229177474975586, 10.542007446289062, 10.854838371276855, 11.167668342590332, 11.480499267578125, 11.793329238891602, 12.106159210205078, 12.418989181518555, 12.731820106506348, 13.044650077819824, 13.357481002807617, 13.670310974121094, 13.983141899108887, 14.295971870422363, 14.608802795410156]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 3.0, 6.0, 9.0, 6.0, 7.0, 13.0, 13.0, 21.0, 18.0, 15.0, 30.0, 16.0, 27.0, 28.0, 30.0, 31.0, 48.0, 38.0, 39.0, 42.0, 38.0, 36.0, 41.0, 41.0, 31.0, 37.0, 42.0, 28.0, 31.0, 34.0, 26.0, 25.0, 16.0, 28.0, 21.0, 13.0, 10.0, 8.0, 12.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.989990234375, -6.780808448791504, -6.571626663208008, -6.362444877624512, -6.153263092041016, -5.9440813064575195, -5.734899520874023, -5.525717735290527, -5.316535949707031, -5.107354164123535, -4.898172378540039, -4.688990592956543, -4.479808807373047, -4.270627021789551, -4.061445236206055, -3.8522634506225586, -3.6430819034576416, -3.4339001178741455, -3.2247183322906494, -3.0155365467071533, -2.8063547611236572, -2.5971732139587402, -2.387991428375244, -2.178809642791748, -1.9696277379989624, -1.7604459524154663, -1.5512641668319702, -1.3420825004577637, -1.1329007148742676, -0.9237189292907715, -0.7145371437072754, -0.5053553581237793, -0.2961735725402832, -0.0869918018579483, 0.1221899688243866, 0.3313717246055603, 0.5405535101890564, 0.7497352361679077, 0.9589170217514038, 1.1680988073349, 1.377280592918396, 1.586462378501892, 1.7956441640853882, 2.0048258304595947, 2.214007616043091, 2.423189401626587, 2.632371187210083, 2.841552972793579, 3.050734758377075, 3.2599165439605713, 3.4690983295440674, 3.6782801151275635, 3.8874619007110596, 4.096643447875977, 4.305825233459473, 4.515007019042969, 4.724188804626465, 4.933370590209961, 5.142552375793457, 5.351734161376953, 5.560915946960449, 5.770097732543945, 5.979279518127441, 6.1884613037109375, 6.397643089294434]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 15.0, 18.0, 28.0, 56.0, 83.0, 145.0, 291.0, 500.0, 1473.0, 14835.0, 1133063.0, 2995897.0, 44668.0, 2202.0, 524.0, 200.0, 94.0, 65.0, 39.0, 26.0, 16.0, 11.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.6241455078125, -6.349853515625, -6.0755615234375, -5.80126953125, -5.5269775390625, -5.252685546875, -4.9783935546875, -4.7041015625, -4.4298095703125, -4.155517578125, -3.8812255859375, -3.60693359375, -3.3326416015625, -3.058349609375, -2.7840576171875, -2.509765625, -2.2354736328125, -1.961181640625, -1.6868896484375, -1.41259765625, -1.1383056640625, -0.864013671875, -0.5897216796875, -0.3154296875, -0.0411376953125, 0.233154296875, 0.5074462890625, 0.78173828125, 1.0560302734375, 1.330322265625, 1.6046142578125, 1.87890625, 2.1531982421875, 2.427490234375, 2.7017822265625, 2.97607421875, 3.2503662109375, 3.524658203125, 3.7989501953125, 4.0732421875, 4.3475341796875, 4.621826171875, 4.8961181640625, 5.17041015625, 5.4447021484375, 5.718994140625, 5.9932861328125, 6.267578125, 6.5418701171875, 6.816162109375, 7.0904541015625, 7.36474609375, 7.6390380859375, 7.913330078125, 8.1876220703125, 8.4619140625, 8.7362060546875, 9.010498046875, 9.2847900390625, 9.55908203125, 9.8333740234375, 10.107666015625, 10.3819580078125, 10.65625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 14.0, 19.0, 24.0, 28.0, 38.0, 25.0, 41.0, 49.0, 42.0, 59.0, 54.0, 61.0, 48.0, 48.0, 51.0, 52.0, 56.0, 38.0, 34.0, 29.0, 36.0, 15.0, 19.0, 23.0, 19.0, 14.0, 10.0, 12.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.544921875, -2.45587158203125, -2.3668212890625, -2.27777099609375, -2.188720703125, -2.09967041015625, -2.0106201171875, -1.92156982421875, -1.83251953125, -1.74346923828125, -1.6544189453125, -1.56536865234375, -1.476318359375, -1.38726806640625, -1.2982177734375, -1.20916748046875, -1.1201171875, -1.03106689453125, -0.9420166015625, -0.85296630859375, -0.763916015625, -0.67486572265625, -0.5858154296875, -0.49676513671875, -0.40771484375, -0.31866455078125, -0.2296142578125, -0.14056396484375, -0.051513671875, 0.03753662109375, 0.1265869140625, 0.21563720703125, 0.3046875, 0.39373779296875, 0.4827880859375, 0.57183837890625, 0.660888671875, 0.74993896484375, 0.8389892578125, 0.92803955078125, 1.01708984375, 1.10614013671875, 1.1951904296875, 1.28424072265625, 1.373291015625, 1.46234130859375, 1.5513916015625, 1.64044189453125, 1.7294921875, 1.81854248046875, 1.9075927734375, 1.99664306640625, 2.085693359375, 2.17474365234375, 2.2637939453125, 2.35284423828125, 2.44189453125, 2.53094482421875, 2.6199951171875, 2.70904541015625, 2.798095703125, 2.88714599609375, 2.9761962890625, 3.06524658203125, 3.154296875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 5.0, 14.0, 9.0, 22.0, 31.0, 25.0, 44.0, 50.0, 98.0, 135.0, 197.0, 319.0, 496.0, 895.0, 1688.0, 3818.0, 11549.0, 49492.0, 321199.0, 2373076.0, 1243765.0, 146760.0, 27102.0, 7353.0, 2785.0, 1359.0, 692.0, 448.0, 243.0, 180.0, 109.0, 88.0, 58.0, 50.0, 39.0, 28.0, 12.0, 8.0, 11.0, 8.0, 5.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.865234375, -2.775146484375, -2.68505859375, -2.594970703125, -2.5048828125, -2.414794921875, -2.32470703125, -2.234619140625, -2.14453125, -2.054443359375, -1.96435546875, -1.874267578125, -1.7841796875, -1.694091796875, -1.60400390625, -1.513916015625, -1.423828125, -1.333740234375, -1.24365234375, -1.153564453125, -1.0634765625, -0.973388671875, -0.88330078125, -0.793212890625, -0.703125, -0.613037109375, -0.52294921875, -0.432861328125, -0.3427734375, -0.252685546875, -0.16259765625, -0.072509765625, 0.017578125, 0.107666015625, 0.19775390625, 0.287841796875, 0.3779296875, 0.468017578125, 0.55810546875, 0.648193359375, 0.73828125, 0.828369140625, 0.91845703125, 1.008544921875, 1.0986328125, 1.188720703125, 1.27880859375, 1.368896484375, 1.458984375, 1.549072265625, 1.63916015625, 1.729248046875, 1.8193359375, 1.909423828125, 1.99951171875, 2.089599609375, 2.1796875, 2.269775390625, 2.35986328125, 2.449951171875, 2.5400390625, 2.630126953125, 2.72021484375, 2.810302734375, 2.900390625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 9.0, 12.0, 27.0, 30.0, 50.0, 39.0, 66.0, 95.0, 125.0, 181.0, 251.0, 330.0, 407.0, 491.0, 477.0, 396.0, 293.0, 225.0, 164.0, 109.0, 81.0, 66.0, 36.0, 27.0, 13.0, 21.0, 6.0, 15.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9188613891601562, -0.8880157470703125, -0.8571701049804688, -0.826324462890625, -0.7954788208007812, -0.7646331787109375, -0.7337875366210938, -0.70294189453125, -0.6720962524414062, -0.6412506103515625, -0.6104049682617188, -0.579559326171875, -0.5487136840820312, -0.5178680419921875, -0.48702239990234375, -0.4561767578125, -0.42533111572265625, -0.3944854736328125, -0.36363983154296875, -0.332794189453125, -0.30194854736328125, -0.2711029052734375, -0.24025726318359375, -0.20941162109375, -0.17856597900390625, -0.1477203369140625, -0.11687469482421875, -0.086029052734375, -0.05518341064453125, -0.0243377685546875, 0.00650787353515625, 0.037353515625, 0.06819915771484375, 0.0990447998046875, 0.12989044189453125, 0.160736083984375, 0.19158172607421875, 0.2224273681640625, 0.25327301025390625, 0.28411865234375, 0.31496429443359375, 0.3458099365234375, 0.37665557861328125, 0.407501220703125, 0.43834686279296875, 0.4691925048828125, 0.5000381469726562, 0.5308837890625, 0.5617294311523438, 0.5925750732421875, 0.6234207153320312, 0.654266357421875, 0.6851119995117188, 0.7159576416015625, 0.7468032836914062, 0.77764892578125, 0.8084945678710938, 0.8393402099609375, 0.8701858520507812, 0.901031494140625, 0.9318771362304688, 0.9627227783203125, 0.9935684204101562, 1.0244140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 23.0, 48.0, 40.0, 78.0, 95.0, 116.0, 106.0, 123.0, 92.0, 75.0, 59.0, 45.0, 33.0, 17.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6815876960754395, -4.513382911682129, -4.345178604125977, -4.176973819732666, -4.0087690353393555, -3.840564727783203, -3.6723599433898926, -3.504155397415161, -3.3359508514404297, -3.1677463054656982, -2.999541759490967, -2.8313369750976562, -2.663132429122925, -2.4949278831481934, -2.326723098754883, -2.1585185527801514, -1.99031400680542, -1.8221094608306885, -1.6539047956466675, -1.4857001304626465, -1.317495584487915, -1.1492910385131836, -0.9810863733291626, -0.8128817081451416, -0.6446771621704102, -0.47647255659103394, -0.3082679510116577, -0.1400633454322815, 0.028141260147094727, 0.19634586572647095, 0.36455047130584717, 0.5327551364898682, 0.7009592056274414, 0.8691638112068176, 1.0373684167861938, 1.2055730819702148, 1.3737776279449463, 1.5419821739196777, 1.7101868391036987, 1.8783915042877197, 2.046596050262451, 2.2148005962371826, 2.383005142211914, 2.5512099266052246, 2.719414472579956, 2.8876190185546875, 3.055823802947998, 3.2240283489227295, 3.392232894897461, 3.5604374408721924, 3.728641986846924, 3.8968467712402344, 4.065051078796387, 4.233255863189697, 4.401460647583008, 4.56966495513916, 4.737869739532471, 4.906074523925781, 5.074278831481934, 5.242483615875244, 5.410688400268555, 5.578892707824707, 5.747097492218018, 5.915302276611328, 6.0835065841674805]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 4.0, 9.0, 13.0, 16.0, 21.0, 18.0, 15.0, 24.0, 40.0, 42.0, 35.0, 32.0, 52.0, 45.0, 42.0, 49.0, 57.0, 43.0, 43.0, 45.0, 39.0, 29.0, 39.0, 32.0, 30.0, 29.0, 22.0, 26.0, 20.0, 12.0, 16.0, 12.0, 11.0, 10.0, 3.0, 6.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1871447563171387, -2.0993478298187256, -2.0115509033203125, -1.9237537384033203, -1.8359568119049072, -1.7481598854064941, -1.6603628396987915, -1.5725657939910889, -1.4847688674926758, -1.3969719409942627, -1.30917489528656, -1.2213778495788574, -1.1335809230804443, -1.0457839965820312, -0.9579869508743286, -0.8701899647712708, -0.7823929786682129, -0.694595992565155, -0.6067990064620972, -0.5190020203590393, -0.43120503425598145, -0.3434080481529236, -0.2556110620498657, -0.16781407594680786, -0.08001708984375, 0.007779896259307861, 0.09557688236236572, 0.18337386846542358, 0.27117085456848145, 0.3589678406715393, 0.44676482677459717, 0.534561812877655, 0.6223587989807129, 0.7101557850837708, 0.7979527711868286, 0.8857497572898865, 0.9735467433929443, 1.0613436698913574, 1.14914071559906, 1.2369377613067627, 1.3247346878051758, 1.4125316143035889, 1.5003286600112915, 1.5881257057189941, 1.6759226322174072, 1.7637195587158203, 1.851516604423523, 1.9393136501312256, 2.0271105766296387, 2.1149075031280518, 2.202704429626465, 2.290501594543457, 2.37829852104187, 2.466095447540283, 2.5538926124572754, 2.6416895389556885, 2.7294864654541016, 2.8172833919525146, 2.9050803184509277, 2.99287748336792, 3.080674409866333, 3.168471336364746, 3.2562685012817383, 3.3440654277801514, 3.4318623542785645]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 9.0, 12.0, 10.0, 18.0, 45.0, 42.0, 72.0, 127.0, 187.0, 299.0, 475.0, 782.0, 1386.0, 2585.0, 4755.0, 8998.0, 17310.0, 34162.0, 69057.0, 134523.0, 222737.0, 236295.0, 152690.0, 79492.0, 39834.0, 20090.0, 10338.0, 5382.0, 2840.0, 1616.0, 959.0, 547.0, 360.0, 169.0, 124.0, 65.0, 54.0, 33.0, 21.0, 12.0, 8.0, 11.0, 10.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29833984375, -0.2880897521972656, -0.27783966064453125, -0.2675895690917969, -0.2573394775390625, -0.24708938598632812, -0.23683929443359375, -0.22658920288085938, -0.216339111328125, -0.20608901977539062, -0.19583892822265625, -0.18558883666992188, -0.1753387451171875, -0.16508865356445312, -0.15483856201171875, -0.14458847045898438, -0.13433837890625, -0.12408828735351562, -0.11383819580078125, -0.10358810424804688, -0.0933380126953125, -0.08308792114257812, -0.07283782958984375, -0.06258773803710938, -0.052337646484375, -0.042087554931640625, -0.03183746337890625, -0.021587371826171875, -0.0113372802734375, -0.001087188720703125, 0.00916290283203125, 0.019412994384765625, 0.0296630859375, 0.039913177490234375, 0.05016326904296875, 0.060413360595703125, 0.0706634521484375, 0.08091354370117188, 0.09116363525390625, 0.10141372680664062, 0.111663818359375, 0.12191390991210938, 0.13216400146484375, 0.14241409301757812, 0.1526641845703125, 0.16291427612304688, 0.17316436767578125, 0.18341445922851562, 0.19366455078125, 0.20391464233398438, 0.21416473388671875, 0.22441482543945312, 0.2346649169921875, 0.24491500854492188, 0.25516510009765625, 0.2654151916503906, 0.275665283203125, 0.2859153747558594, 0.29616546630859375, 0.3064155578613281, 0.3166656494140625, 0.3269157409667969, 0.33716583251953125, 0.3474159240722656, 0.357666015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 10.0, 18.0, 14.0, 23.0, 29.0, 32.0, 39.0, 50.0, 51.0, 54.0, 61.0, 46.0, 75.0, 52.0, 61.0, 54.0, 49.0, 42.0, 41.0, 34.0, 34.0, 19.0, 27.0, 21.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.977020263671875, -1.90325927734375, -1.829498291015625, -1.7557373046875, -1.681976318359375, -1.60821533203125, -1.534454345703125, -1.460693359375, -1.386932373046875, -1.31317138671875, -1.239410400390625, -1.1656494140625, -1.091888427734375, -1.01812744140625, -0.944366455078125, -0.87060546875, -0.796844482421875, -0.72308349609375, -0.649322509765625, -0.5755615234375, -0.501800537109375, -0.42803955078125, -0.354278564453125, -0.280517578125, -0.206756591796875, -0.13299560546875, -0.059234619140625, 0.0145263671875, 0.088287353515625, 0.16204833984375, 0.235809326171875, 0.3095703125, 0.383331298828125, 0.45709228515625, 0.530853271484375, 0.6046142578125, 0.678375244140625, 0.75213623046875, 0.825897216796875, 0.899658203125, 0.973419189453125, 1.04718017578125, 1.120941162109375, 1.1947021484375, 1.268463134765625, 1.34222412109375, 1.415985107421875, 1.48974609375, 1.563507080078125, 1.63726806640625, 1.711029052734375, 1.7847900390625, 1.858551025390625, 1.93231201171875, 2.006072998046875, 2.079833984375, 2.153594970703125, 2.22735595703125, 2.301116943359375, 2.3748779296875, 2.448638916015625, 2.52239990234375, 2.596160888671875, 2.669921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 13.0, 11.0, 27.0, 33.0, 37.0, 55.0, 116.0, 181.0, 253.0, 350.0, 578.0, 924.0, 1468.0, 2286.0, 3756.0, 6067.0, 9921.0, 16653.0, 28144.0, 47509.0, 78949.0, 126556.0, 179745.0, 187269.0, 138586.0, 88279.0, 52505.0, 31036.0, 18509.0, 11112.0, 6808.0, 4083.0, 2488.0, 1575.0, 916.0, 600.0, 411.0, 259.0, 156.0, 113.0, 79.0, 42.0, 35.0, 23.0, 16.0, 9.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.19921875, -0.19237518310546875, -0.1855316162109375, -0.17868804931640625, -0.171844482421875, -0.16500091552734375, -0.1581573486328125, -0.15131378173828125, -0.14447021484375, -0.13762664794921875, -0.1307830810546875, -0.12393951416015625, -0.117095947265625, -0.11025238037109375, -0.1034088134765625, -0.09656524658203125, -0.0897216796875, -0.08287811279296875, -0.0760345458984375, -0.06919097900390625, -0.062347412109375, -0.05550384521484375, -0.0486602783203125, -0.04181671142578125, -0.03497314453125, -0.02812957763671875, -0.0212860107421875, -0.01444244384765625, -0.007598876953125, -0.00075531005859375, 0.0060882568359375, 0.01293182373046875, 0.019775390625, 0.02661895751953125, 0.0334625244140625, 0.04030609130859375, 0.047149658203125, 0.05399322509765625, 0.0608367919921875, 0.06768035888671875, 0.07452392578125, 0.08136749267578125, 0.0882110595703125, 0.09505462646484375, 0.101898193359375, 0.10874176025390625, 0.1155853271484375, 0.12242889404296875, 0.1292724609375, 0.13611602783203125, 0.1429595947265625, 0.14980316162109375, 0.156646728515625, 0.16349029541015625, 0.1703338623046875, 0.17717742919921875, 0.18402099609375, 0.19086456298828125, 0.1977081298828125, 0.20455169677734375, 0.211395263671875, 0.21823883056640625, 0.2250823974609375, 0.23192596435546875, 0.23876953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 8.0, 7.0, 3.0, 10.0, 11.0, 17.0, 12.0, 18.0, 12.0, 22.0, 27.0, 22.0, 39.0, 45.0, 35.0, 52.0, 59.0, 65.0, 52.0, 47.0, 58.0, 61.0, 45.0, 39.0, 34.0, 31.0, 23.0, 25.0, 22.0, 19.0, 15.0, 16.0, 16.0, 12.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.5379638671875, -3.415771484375, -3.2935791015625, -3.17138671875, -3.0491943359375, -2.927001953125, -2.8048095703125, -2.6826171875, -2.5604248046875, -2.438232421875, -2.3160400390625, -2.19384765625, -2.0716552734375, -1.949462890625, -1.8272705078125, -1.705078125, -1.5828857421875, -1.460693359375, -1.3385009765625, -1.21630859375, -1.0941162109375, -0.971923828125, -0.8497314453125, -0.7275390625, -0.6053466796875, -0.483154296875, -0.3609619140625, -0.23876953125, -0.1165771484375, 0.005615234375, 0.1278076171875, 0.25, 0.3721923828125, 0.494384765625, 0.6165771484375, 0.73876953125, 0.8609619140625, 0.983154296875, 1.1053466796875, 1.2275390625, 1.3497314453125, 1.471923828125, 1.5941162109375, 1.71630859375, 1.8385009765625, 1.960693359375, 2.0828857421875, 2.205078125, 2.3272705078125, 2.449462890625, 2.5716552734375, 2.69384765625, 2.8160400390625, 2.938232421875, 3.0604248046875, 3.1826171875, 3.3048095703125, 3.427001953125, 3.5491943359375, 3.67138671875, 3.7935791015625, 3.915771484375, 4.0379638671875, 4.16015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 12.0, 14.0, 17.0, 21.0, 42.0, 67.0, 86.0, 111.0, 166.0, 263.0, 359.0, 556.0, 879.0, 1551.0, 2697.0, 5497.0, 11883.0, 29287.0, 72777.0, 192802.0, 373907.0, 215857.0, 80788.0, 32216.0, 13543.0, 6032.0, 2893.0, 1567.0, 913.0, 563.0, 358.0, 261.0, 163.0, 117.0, 77.0, 64.0, 44.0, 30.0, 16.0, 14.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.041748046875, -0.04050397872924805, -0.039259910583496094, -0.03801584243774414, -0.03677177429199219, -0.035527706146240234, -0.03428363800048828, -0.03303956985473633, -0.031795501708984375, -0.030551433563232422, -0.02930736541748047, -0.028063297271728516, -0.026819229125976562, -0.02557516098022461, -0.024331092834472656, -0.023087024688720703, -0.02184295654296875, -0.020598888397216797, -0.019354820251464844, -0.01811075210571289, -0.016866683959960938, -0.015622615814208984, -0.014378547668457031, -0.013134479522705078, -0.011890411376953125, -0.010646343231201172, -0.009402275085449219, -0.008158206939697266, -0.0069141387939453125, -0.005670070648193359, -0.004426002502441406, -0.003181934356689453, -0.0019378662109375, -0.0006937980651855469, 0.0005502700805664062, 0.0017943382263183594, 0.0030384063720703125, 0.004282474517822266, 0.005526542663574219, 0.006770610809326172, 0.008014678955078125, 0.009258747100830078, 0.010502815246582031, 0.011746883392333984, 0.012990951538085938, 0.01423501968383789, 0.015479087829589844, 0.016723155975341797, 0.01796722412109375, 0.019211292266845703, 0.020455360412597656, 0.02169942855834961, 0.022943496704101562, 0.024187564849853516, 0.02543163299560547, 0.026675701141357422, 0.027919769287109375, 0.029163837432861328, 0.03040790557861328, 0.031651973724365234, 0.03289604187011719, 0.03414011001586914, 0.035384178161621094, 0.03662824630737305, 0.037872314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 11.0, 18.0, 27.0, 43.0, 70.0, 82.0, 105.0, 127.0, 126.0, 106.0, 63.0, 62.0, 41.0, 33.0, 21.0, 14.0, 15.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.441904067993164e-05, -5.2912160754203796e-05, -5.140528082847595e-05, -4.989840090274811e-05, -4.8391520977020264e-05, -4.688464105129242e-05, -4.5377761125564575e-05, -4.387088119983673e-05, -4.236400127410889e-05, -4.085712134838104e-05, -3.93502414226532e-05, -3.7843361496925354e-05, -3.633648157119751e-05, -3.4829601645469666e-05, -3.332272171974182e-05, -3.181584179401398e-05, -3.0308961868286133e-05, -2.880208194255829e-05, -2.7295202016830444e-05, -2.57883220911026e-05, -2.4281442165374756e-05, -2.277456223964691e-05, -2.1267682313919067e-05, -1.9760802388191223e-05, -1.825392246246338e-05, -1.6747042536735535e-05, -1.524016261100769e-05, -1.3733282685279846e-05, -1.2226402759552002e-05, -1.0719522833824158e-05, -9.212642908096313e-06, -7.70576298236847e-06, -6.198883056640625e-06, -4.692003130912781e-06, -3.1851232051849365e-06, -1.6782432794570923e-06, -1.7136335372924805e-07, 1.3355165719985962e-06, 2.8423964977264404e-06, 4.349276423454285e-06, 5.856156349182129e-06, 7.363036274909973e-06, 8.869916200637817e-06, 1.0376796126365662e-05, 1.1883676052093506e-05, 1.339055597782135e-05, 1.4897435903549194e-05, 1.640431582927704e-05, 1.7911195755004883e-05, 1.9418075680732727e-05, 2.092495560646057e-05, 2.2431835532188416e-05, 2.393871545791626e-05, 2.5445595383644104e-05, 2.6952475309371948e-05, 2.8459355235099792e-05, 2.9966235160827637e-05, 3.147311508655548e-05, 3.2979995012283325e-05, 3.448687493801117e-05, 3.5993754863739014e-05, 3.750063478946686e-05, 3.90075147151947e-05, 4.0514394640922546e-05, 4.202127456665039e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 12.0, 10.0, 10.0, 26.0, 24.0, 46.0, 54.0, 61.0, 94.0, 155.0, 298.0, 532.0, 1248.0, 3007.0, 8031.0, 23491.0, 72940.0, 241580.0, 430138.0, 182529.0, 55249.0, 18095.0, 6366.0, 2380.0, 1011.0, 494.0, 230.0, 135.0, 106.0, 51.0, 38.0, 33.0, 19.0, 19.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.052001953125, -0.05048942565917969, -0.048976898193359375, -0.04746437072753906, -0.04595184326171875, -0.04443931579589844, -0.042926788330078125, -0.04141426086425781, -0.0399017333984375, -0.03838920593261719, -0.036876678466796875, -0.03536415100097656, -0.03385162353515625, -0.03233909606933594, -0.030826568603515625, -0.029314041137695312, -0.027801513671875, -0.026288986206054688, -0.024776458740234375, -0.023263931274414062, -0.02175140380859375, -0.020238876342773438, -0.018726348876953125, -0.017213821411132812, -0.0157012939453125, -0.014188766479492188, -0.012676239013671875, -0.011163711547851562, -0.00965118408203125, -0.008138656616210938, -0.006626129150390625, -0.0051136016845703125, -0.00360107421875, -0.0020885467529296875, -0.000576019287109375, 0.0009365081787109375, 0.00244903564453125, 0.0039615631103515625, 0.005474090576171875, 0.0069866180419921875, 0.0084991455078125, 0.010011672973632812, 0.011524200439453125, 0.013036727905273438, 0.01454925537109375, 0.016061782836914062, 0.017574310302734375, 0.019086837768554688, 0.020599365234375, 0.022111892700195312, 0.023624420166015625, 0.025136947631835938, 0.02664947509765625, 0.028162002563476562, 0.029674530029296875, 0.031187057495117188, 0.0326995849609375, 0.03421211242675781, 0.035724639892578125, 0.03723716735839844, 0.03874969482421875, 0.04026222229003906, 0.041774749755859375, 0.04328727722167969, 0.0447998046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 9.0, 17.0, 10.0, 17.0, 14.0, 23.0, 22.0, 29.0, 40.0, 47.0, 59.0, 71.0, 75.0, 87.0, 73.0, 72.0, 49.0, 39.0, 39.0, 22.0, 33.0, 13.0, 18.0, 18.0, 13.0, 8.0, 9.0, 15.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01336669921875, -0.012975931167602539, -0.012585163116455078, -0.012194395065307617, -0.011803627014160156, -0.011412858963012695, -0.011022090911865234, -0.010631322860717773, -0.010240554809570312, -0.009849786758422852, -0.00945901870727539, -0.00906825065612793, -0.008677482604980469, -0.008286714553833008, -0.007895946502685547, -0.007505178451538086, -0.007114410400390625, -0.006723642349243164, -0.006332874298095703, -0.005942106246948242, -0.005551338195800781, -0.00516057014465332, -0.004769802093505859, -0.0043790340423583984, -0.0039882659912109375, -0.0035974979400634766, -0.0032067298889160156, -0.0028159618377685547, -0.0024251937866210938, -0.002034425735473633, -0.0016436576843261719, -0.001252889633178711, -0.00086212158203125, -0.00047135353088378906, -8.058547973632812e-05, 0.0003101825714111328, 0.0007009506225585938, 0.0010917186737060547, 0.0014824867248535156, 0.0018732547760009766, 0.0022640228271484375, 0.0026547908782958984, 0.0030455589294433594, 0.0034363269805908203, 0.0038270950317382812, 0.004217863082885742, 0.004608631134033203, 0.004999399185180664, 0.005390167236328125, 0.005780935287475586, 0.006171703338623047, 0.006562471389770508, 0.006953239440917969, 0.00734400749206543, 0.007734775543212891, 0.008125543594360352, 0.008516311645507812, 0.008907079696655273, 0.009297847747802734, 0.009688615798950195, 0.010079383850097656, 0.010470151901245117, 0.010860919952392578, 0.011251688003540039, 0.0116424560546875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 22.0, 75.0, 207.0, 344.0, 229.0, 98.0, 27.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285140991210938, -7.9953107833862305, -7.705480098724365, -7.4156494140625, -7.125819206237793, -6.835988998413086, -6.546158313751221, -6.2563276290893555, -5.966497421264648, -5.676667213439941, -5.386836528778076, -5.097005844116211, -4.807175636291504, -4.517345428466797, -4.227514743804932, -3.9376842975616455, -3.6478538513183594, -3.3580234050750732, -3.068192958831787, -2.778362512588501, -2.488532066345215, -2.1987016201019287, -1.9088711738586426, -1.6190407276153564, -1.3292102813720703, -1.0393798351287842, -0.749549388885498, -0.4597189426422119, -0.16988849639892578, 0.11994194984436035, 0.4097723960876465, 0.6996028423309326, 0.9894332885742188, 1.2792637348175049, 1.569094181060791, 1.8589246273040771, 2.1487550735473633, 2.4385855197906494, 2.7284159660339355, 3.0182464122772217, 3.308076858520508, 3.597907304763794, 3.88773775100708, 4.177568435668945, 4.467398643493652, 4.757228851318359, 5.047059535980225, 5.33689022064209, 5.626720428466797, 5.916550636291504, 6.206381320953369, 6.496212005615234, 6.786042213439941, 7.075872421264648, 7.365703105926514, 7.655533790588379, 7.945363998413086, 8.235194206237793, 8.5250244140625, 8.814855575561523, 9.10468578338623, 9.394515991210938, 9.684347152709961, 9.974177360534668, 10.264007568359375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 4.0, 8.0, 15.0, 10.0, 22.0, 26.0, 27.0, 35.0, 39.0, 57.0, 50.0, 61.0, 61.0, 69.0, 62.0, 54.0, 60.0, 43.0, 48.0, 42.0, 36.0, 25.0, 29.0, 30.0, 19.0, 15.0, 13.0, 13.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75247061252594, -1.680452585220337, -1.6084344387054443, -1.5364164113998413, -1.4643983840942383, -1.3923802375793457, -1.3203622102737427, -1.2483441829681396, -1.176326036453247, -1.104308009147644, -1.0322898626327515, -0.9602718353271484, -0.8882537484169006, -0.8162356615066528, -0.7442176342010498, -0.672199547290802, -0.6001814603805542, -0.5281633734703064, -0.456145316362381, -0.38412725925445557, -0.31210917234420776, -0.24009108543395996, -0.16807302832603455, -0.09605497121810913, -0.024036884307861328, 0.04798118770122528, 0.11999925971031189, 0.1920173317193985, 0.2640354037284851, 0.3360534906387329, 0.4080715477466583, 0.48008960485458374, 0.552107572555542, 0.6241256594657898, 0.6961437463760376, 0.7681617736816406, 0.8401798605918884, 0.9121979475021362, 0.9842159748077393, 1.0562341213226318, 1.1282521486282349, 1.200270175933838, 1.2722883224487305, 1.3443063497543335, 1.4163243770599365, 1.488342523574829, 1.5603605508804321, 1.6323785781860352, 1.7043967247009277, 1.7764147520065308, 1.8484328985214233, 1.9204509258270264, 1.992469072341919, 2.0644869804382324, 2.136505126953125, 2.2085232734680176, 2.28054141998291, 2.3525595664978027, 2.424577474594116, 2.496595621109009, 2.5686137676239014, 2.640631675720215, 2.7126498222351074, 2.78466796875, 2.8566858768463135]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 10.0, 18.0, 21.0, 31.0, 37.0, 70.0, 112.0, 163.0, 301.0, 477.0, 845.0, 1679.0, 2996.0, 6544.0, 13119.0, 28816.0, 64778.0, 151884.0, 291144.0, 262220.0, 124225.0, 52830.0, 23681.0, 11123.0, 5420.0, 2640.0, 1433.0, 794.0, 401.0, 245.0, 163.0, 88.0, 68.0, 38.0, 28.0, 22.0, 16.0, 8.0, 6.0, 7.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.38671875, -1.3418121337890625, -1.296905517578125, -1.2519989013671875, -1.20709228515625, -1.1621856689453125, -1.117279052734375, -1.0723724365234375, -1.0274658203125, -0.9825592041015625, -0.937652587890625, -0.8927459716796875, -0.84783935546875, -0.8029327392578125, -0.758026123046875, -0.7131195068359375, -0.668212890625, -0.6233062744140625, -0.578399658203125, -0.5334930419921875, -0.48858642578125, -0.4436798095703125, -0.398773193359375, -0.3538665771484375, -0.3089599609375, -0.2640533447265625, -0.219146728515625, -0.1742401123046875, -0.12933349609375, -0.0844268798828125, -0.039520263671875, 0.0053863525390625, 0.05029296875, 0.0951995849609375, 0.140106201171875, 0.1850128173828125, 0.22991943359375, 0.2748260498046875, 0.319732666015625, 0.3646392822265625, 0.4095458984375, 0.4544525146484375, 0.499359130859375, 0.5442657470703125, 0.58917236328125, 0.6340789794921875, 0.678985595703125, 0.7238922119140625, 0.768798828125, 0.8137054443359375, 0.858612060546875, 0.9035186767578125, 0.94842529296875, 0.9933319091796875, 1.038238525390625, 1.0831451416015625, 1.1280517578125, 1.1729583740234375, 1.217864990234375, 1.2627716064453125, 1.30767822265625, 1.3525848388671875, 1.397491455078125, 1.4423980712890625, 1.4873046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 11.0, 15.0, 17.0, 17.0, 20.0, 26.0, 35.0, 29.0, 42.0, 51.0, 49.0, 33.0, 47.0, 54.0, 62.0, 52.0, 56.0, 38.0, 45.0, 40.0, 33.0, 33.0, 33.0, 29.0, 21.0, 17.0, 19.0, 14.0, 6.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.154296875, -3.035369873046875, -2.91644287109375, -2.797515869140625, -2.6785888671875, -2.559661865234375, -2.44073486328125, -2.321807861328125, -2.202880859375, -2.083953857421875, -1.96502685546875, -1.846099853515625, -1.7271728515625, -1.608245849609375, -1.48931884765625, -1.370391845703125, -1.25146484375, -1.132537841796875, -1.01361083984375, -0.894683837890625, -0.7757568359375, -0.656829833984375, -0.53790283203125, -0.418975830078125, -0.300048828125, -0.181121826171875, -0.06219482421875, 0.056732177734375, 0.1756591796875, 0.294586181640625, 0.41351318359375, 0.532440185546875, 0.6513671875, 0.770294189453125, 0.88922119140625, 1.008148193359375, 1.1270751953125, 1.246002197265625, 1.36492919921875, 1.483856201171875, 1.602783203125, 1.721710205078125, 1.84063720703125, 1.959564208984375, 2.0784912109375, 2.197418212890625, 2.31634521484375, 2.435272216796875, 2.55419921875, 2.673126220703125, 2.79205322265625, 2.910980224609375, 3.0299072265625, 3.148834228515625, 3.26776123046875, 3.386688232421875, 3.505615234375, 3.624542236328125, 3.74346923828125, 3.862396240234375, 3.9813232421875, 4.100250244140625, 4.21917724609375, 4.338104248046875, 4.45703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 22.0, 8.0, 22.0, 38.0, 49.0, 45.0, 69.0, 97.0, 138.0, 201.0, 343.0, 825.0, 3998.0, 51582.0, 724140.0, 250410.0, 13599.0, 1606.0, 487.0, 269.0, 170.0, 101.0, 77.0, 61.0, 29.0, 27.0, 26.0, 17.0, 15.0, 11.0, 9.0, 7.0, 10.0, 5.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.7305908203125, -4.586181640625, -4.4417724609375, -4.29736328125, -4.1529541015625, -4.008544921875, -3.8641357421875, -3.7197265625, -3.5753173828125, -3.430908203125, -3.2864990234375, -3.14208984375, -2.9976806640625, -2.853271484375, -2.7088623046875, -2.564453125, -2.4200439453125, -2.275634765625, -2.1312255859375, -1.98681640625, -1.8424072265625, -1.697998046875, -1.5535888671875, -1.4091796875, -1.2647705078125, -1.120361328125, -0.9759521484375, -0.83154296875, -0.6871337890625, -0.542724609375, -0.3983154296875, -0.25390625, -0.1094970703125, 0.034912109375, 0.1793212890625, 0.32373046875, 0.4681396484375, 0.612548828125, 0.7569580078125, 0.9013671875, 1.0457763671875, 1.190185546875, 1.3345947265625, 1.47900390625, 1.6234130859375, 1.767822265625, 1.9122314453125, 2.056640625, 2.2010498046875, 2.345458984375, 2.4898681640625, 2.63427734375, 2.7786865234375, 2.923095703125, 3.0675048828125, 3.2119140625, 3.3563232421875, 3.500732421875, 3.6451416015625, 3.78955078125, 3.9339599609375, 4.078369140625, 4.2227783203125, 4.3671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 5.0, 3.0, 11.0, 14.0, 18.0, 17.0, 21.0, 21.0, 17.0, 34.0, 39.0, 32.0, 33.0, 43.0, 36.0, 43.0, 52.0, 51.0, 52.0, 41.0, 42.0, 45.0, 48.0, 33.0, 33.0, 27.0, 20.0, 25.0, 19.0, 19.0, 21.0, 13.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0670166015625, -3.930908203125, -3.7947998046875, -3.65869140625, -3.5225830078125, -3.386474609375, -3.2503662109375, -3.1142578125, -2.9781494140625, -2.842041015625, -2.7059326171875, -2.56982421875, -2.4337158203125, -2.297607421875, -2.1614990234375, -2.025390625, -1.8892822265625, -1.753173828125, -1.6170654296875, -1.48095703125, -1.3448486328125, -1.208740234375, -1.0726318359375, -0.9365234375, -0.8004150390625, -0.664306640625, -0.5281982421875, -0.39208984375, -0.2559814453125, -0.119873046875, 0.0162353515625, 0.15234375, 0.2884521484375, 0.424560546875, 0.5606689453125, 0.69677734375, 0.8328857421875, 0.968994140625, 1.1051025390625, 1.2412109375, 1.3773193359375, 1.513427734375, 1.6495361328125, 1.78564453125, 1.9217529296875, 2.057861328125, 2.1939697265625, 2.330078125, 2.4661865234375, 2.602294921875, 2.7384033203125, 2.87451171875, 3.0106201171875, 3.146728515625, 3.2828369140625, 3.4189453125, 3.5550537109375, 3.691162109375, 3.8272705078125, 3.96337890625, 4.0994873046875, 4.235595703125, 4.3717041015625, 4.5078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 16.0, 24.0, 35.0, 72.0, 186.0, 486.0, 1764.0, 7098.0, 185098.0, 830388.0, 18935.0, 3023.0, 847.0, 293.0, 112.0, 46.0, 26.0, 22.0, 15.0, 10.0, 3.0, 10.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.306640625, -3.217803955078125, -3.12896728515625, -3.040130615234375, -2.9512939453125, -2.862457275390625, -2.77362060546875, -2.684783935546875, -2.595947265625, -2.507110595703125, -2.41827392578125, -2.329437255859375, -2.2406005859375, -2.151763916015625, -2.06292724609375, -1.974090576171875, -1.88525390625, -1.796417236328125, -1.70758056640625, -1.618743896484375, -1.5299072265625, -1.441070556640625, -1.35223388671875, -1.263397216796875, -1.174560546875, -1.085723876953125, -0.99688720703125, -0.908050537109375, -0.8192138671875, -0.730377197265625, -0.64154052734375, -0.552703857421875, -0.4638671875, -0.375030517578125, -0.28619384765625, -0.197357177734375, -0.1085205078125, -0.019683837890625, 0.06915283203125, 0.157989501953125, 0.246826171875, 0.335662841796875, 0.42449951171875, 0.513336181640625, 0.6021728515625, 0.691009521484375, 0.77984619140625, 0.868682861328125, 0.95751953125, 1.046356201171875, 1.13519287109375, 1.224029541015625, 1.3128662109375, 1.401702880859375, 1.49053955078125, 1.579376220703125, 1.668212890625, 1.757049560546875, 1.84588623046875, 1.934722900390625, 2.0235595703125, 2.112396240234375, 2.20123291015625, 2.290069580078125, 2.37890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 10.0, 14.0, 22.0, 47.0, 84.0, 149.0, 178.0, 197.0, 115.0, 70.0, 46.0, 24.0, 15.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037288665771484375, -0.0003618672490119934, -0.00035084784030914307, -0.0003398284316062927, -0.0003288090229034424, -0.00031778961420059204, -0.0003067702054977417, -0.00029575079679489136, -0.000284731388092041, -0.0002737119793891907, -0.00026269257068634033, -0.00025167316198349, -0.00024065375328063965, -0.0002296343445777893, -0.00021861493587493896, -0.00020759552717208862, -0.00019657611846923828, -0.00018555670976638794, -0.0001745373010635376, -0.00016351789236068726, -0.00015249848365783691, -0.00014147907495498657, -0.00013045966625213623, -0.00011944025754928589, -0.00010842084884643555, -9.74014401435852e-05, -8.638203144073486e-05, -7.536262273788452e-05, -6.434321403503418e-05, -5.332380533218384e-05, -4.2304396629333496e-05, -3.1284987926483154e-05, -2.0265579223632812e-05, -9.24617052078247e-06, 1.773238182067871e-06, 1.2792646884918213e-05, 2.3812055587768555e-05, 3.4831464290618896e-05, 4.585087299346924e-05, 5.687028169631958e-05, 6.788969039916992e-05, 7.890909910202026e-05, 8.99285078048706e-05, 0.00010094791650772095, 0.00011196732521057129, 0.00012298673391342163, 0.00013400614261627197, 0.00014502555131912231, 0.00015604496002197266, 0.000167064368724823, 0.00017808377742767334, 0.00018910318613052368, 0.00020012259483337402, 0.00021114200353622437, 0.0002221614122390747, 0.00023318082094192505, 0.0002442002296447754, 0.00025521963834762573, 0.0002662390470504761, 0.0002772584557533264, 0.00028827786445617676, 0.0002992972731590271, 0.00031031668186187744, 0.0003213360905647278, 0.0003323554992675781]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 18.0, 35.0, 54.0, 102.0, 197.0, 327.0, 803.0, 2037.0, 6906.0, 85967.0, 866122.0, 75871.0, 6577.0, 1951.0, 796.0, 324.0, 161.0, 93.0, 51.0, 39.0, 17.0, 18.0, 9.0, 3.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.8271484375, -1.7554473876953125, -1.683746337890625, -1.6120452880859375, -1.54034423828125, -1.4686431884765625, -1.396942138671875, -1.3252410888671875, -1.2535400390625, -1.1818389892578125, -1.110137939453125, -1.0384368896484375, -0.96673583984375, -0.8950347900390625, -0.823333740234375, -0.7516326904296875, -0.679931640625, -0.6082305908203125, -0.536529541015625, -0.4648284912109375, -0.39312744140625, -0.3214263916015625, -0.249725341796875, -0.1780242919921875, -0.1063232421875, -0.0346221923828125, 0.037078857421875, 0.1087799072265625, 0.18048095703125, 0.2521820068359375, 0.323883056640625, 0.3955841064453125, 0.46728515625, 0.5389862060546875, 0.610687255859375, 0.6823883056640625, 0.75408935546875, 0.8257904052734375, 0.897491455078125, 0.9691925048828125, 1.0408935546875, 1.1125946044921875, 1.184295654296875, 1.2559967041015625, 1.32769775390625, 1.3993988037109375, 1.471099853515625, 1.5428009033203125, 1.614501953125, 1.6862030029296875, 1.757904052734375, 1.8296051025390625, 1.90130615234375, 1.9730072021484375, 2.044708251953125, 2.1164093017578125, 2.1881103515625, 2.2598114013671875, 2.331512451171875, 2.4032135009765625, 2.47491455078125, 2.5466156005859375, 2.618316650390625, 2.6900177001953125, 2.76171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 6.0, 16.0, 14.0, 25.0, 38.0, 51.0, 96.0, 117.0, 110.0, 126.0, 101.0, 76.0, 64.0, 44.0, 31.0, 21.0, 12.0, 9.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5828628540039062, -0.5641632080078125, -0.5454635620117188, -0.526763916015625, -0.5080642700195312, -0.4893646240234375, -0.47066497802734375, -0.45196533203125, -0.43326568603515625, -0.4145660400390625, -0.39586639404296875, -0.377166748046875, -0.35846710205078125, -0.3397674560546875, -0.32106781005859375, -0.3023681640625, -0.28366851806640625, -0.2649688720703125, -0.24626922607421875, -0.227569580078125, -0.20886993408203125, -0.1901702880859375, -0.17147064208984375, -0.15277099609375, -0.13407135009765625, -0.1153717041015625, -0.09667205810546875, -0.077972412109375, -0.05927276611328125, -0.0405731201171875, -0.02187347412109375, -0.003173828125, 0.01552581787109375, 0.0342254638671875, 0.05292510986328125, 0.071624755859375, 0.09032440185546875, 0.1090240478515625, 0.12772369384765625, 0.14642333984375, 0.16512298583984375, 0.1838226318359375, 0.20252227783203125, 0.221221923828125, 0.23992156982421875, 0.2586212158203125, 0.27732086181640625, 0.2960205078125, 0.31472015380859375, 0.3334197998046875, 0.35211944580078125, 0.370819091796875, 0.38951873779296875, 0.4082183837890625, 0.42691802978515625, 0.44561767578125, 0.46431732177734375, 0.4830169677734375, 0.5017166137695312, 0.520416259765625, 0.5391159057617188, 0.5578155517578125, 0.5765151977539062, 0.59521484375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 17.0, 49.0, 149.0, 292.0, 307.0, 133.0, 47.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.72396469116211, -29.14010238647461, -28.556238174438477, -27.972375869750977, -27.388513565063477, -26.804651260375977, -26.220787048339844, -25.636924743652344, -25.053062438964844, -24.469200134277344, -23.88533592224121, -23.30147361755371, -22.71761131286621, -22.13374900817871, -21.549884796142578, -20.966022491455078, -20.382160186767578, -19.798297882080078, -19.214433670043945, -18.630571365356445, -18.046709060668945, -17.462846755981445, -16.878982543945312, -16.295120239257812, -15.71125602722168, -15.127392768859863, -14.543530464172363, -13.959667205810547, -13.375804901123047, -12.79194164276123, -12.208078384399414, -11.624216079711914, -11.040355682373047, -10.45649242401123, -9.87263011932373, -9.288766860961914, -8.704904556274414, -8.121041297912598, -7.5371785163879395, -6.953315734863281, -6.369452476501465, -5.785589694976807, -5.201726913452148, -4.617863655090332, -4.034001350402832, -3.4501383304595947, -2.8662753105163574, -2.282412528991699, -1.698549747467041, -1.1146869659423828, -0.5308240652084351, 0.053038835525512695, 0.6369016170501709, 1.220764398574829, 1.8046274185180664, 2.3884902000427246, 2.972352981567383, 3.556215763092041, 4.140078544616699, 4.723941802978516, 5.307804107666016, 5.891667366027832, 6.47553014755249, 7.059392929077148, 7.643255710601807]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 4.0, 10.0, 7.0, 13.0, 12.0, 21.0, 18.0, 18.0, 32.0, 34.0, 23.0, 26.0, 33.0, 46.0, 39.0, 36.0, 36.0, 38.0, 39.0, 46.0, 37.0, 31.0, 43.0, 39.0, 26.0, 23.0, 39.0, 24.0, 26.0, 21.0, 20.0, 20.0, 15.0, 16.0, 18.0, 6.0, 8.0, 4.0, 14.0, 7.0, 6.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.120534896850586, -5.917450428009033, -5.7143659591674805, -5.5112810134887695, -5.308196544647217, -5.105112075805664, -4.902027130126953, -4.6989426612854, -4.495858192443848, -4.292773723602295, -4.089689254760742, -3.8866043090820312, -3.6835198402404785, -3.480435371398926, -3.277350664138794, -3.074265956878662, -2.8711814880371094, -2.6680970191955566, -2.465012311935425, -2.261927604675293, -2.0588431358337402, -1.855758547782898, -1.6526739597320557, -1.4495893716812134, -1.246504783630371, -1.0434201955795288, -0.8403356075286865, -0.6372510194778442, -0.43416643142700195, -0.23108184337615967, -0.027997255325317383, 0.1750873327255249, 0.3781719207763672, 0.5812565088272095, 0.7843410968780518, 0.987425684928894, 1.1905102729797363, 1.3935948610305786, 1.596679449081421, 1.7997640371322632, 2.0028486251831055, 2.205933094024658, 2.40901780128479, 2.612102508544922, 2.8151869773864746, 3.0182714462280273, 3.221356153488159, 3.424440860748291, 3.6275253295898438, 3.8306097984313965, 4.033694267272949, 4.23677921295166, 4.439863681793213, 4.642948150634766, 4.846033096313477, 5.049117565155029, 5.252202033996582, 5.455286502838135, 5.6583709716796875, 5.861455917358398, 6.064540386199951, 6.267624855041504, 6.470709800720215, 6.673794269561768, 6.87687873840332]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 14.0, 15.0, 28.0, 31.0, 42.0, 74.0, 120.0, 143.0, 215.0, 390.0, 778.0, 1995.0, 9057.0, 80389.0, 1338919.0, 2548805.0, 193484.0, 15849.0, 2477.0, 672.0, 264.0, 155.0, 94.0, 70.0, 53.0, 29.0, 28.0, 16.0, 16.0, 8.0, 12.0, 6.0, 9.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.5003662109375, -4.340576171875, -4.1807861328125, -4.02099609375, -3.8612060546875, -3.701416015625, -3.5416259765625, -3.3818359375, -3.2220458984375, -3.062255859375, -2.9024658203125, -2.74267578125, -2.5828857421875, -2.423095703125, -2.2633056640625, -2.103515625, -1.9437255859375, -1.783935546875, -1.6241455078125, -1.46435546875, -1.3045654296875, -1.144775390625, -0.9849853515625, -0.8251953125, -0.6654052734375, -0.505615234375, -0.3458251953125, -0.18603515625, -0.0262451171875, 0.133544921875, 0.2933349609375, 0.453125, 0.6129150390625, 0.772705078125, 0.9324951171875, 1.09228515625, 1.2520751953125, 1.411865234375, 1.5716552734375, 1.7314453125, 1.8912353515625, 2.051025390625, 2.2108154296875, 2.37060546875, 2.5303955078125, 2.690185546875, 2.8499755859375, 3.009765625, 3.1695556640625, 3.329345703125, 3.4891357421875, 3.64892578125, 3.8087158203125, 3.968505859375, 4.1282958984375, 4.2880859375, 4.4478759765625, 4.607666015625, 4.7674560546875, 4.92724609375, 5.0870361328125, 5.246826171875, 5.4066162109375, 5.56640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 10.0, 8.0, 17.0, 16.0, 34.0, 25.0, 48.0, 42.0, 49.0, 46.0, 46.0, 68.0, 70.0, 79.0, 58.0, 63.0, 58.0, 49.0, 44.0, 35.0, 23.0, 20.0, 23.0, 18.0, 11.0, 7.0, 11.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.421875, -2.32513427734375, -2.2283935546875, -2.13165283203125, -2.034912109375, -1.93817138671875, -1.8414306640625, -1.74468994140625, -1.64794921875, -1.55120849609375, -1.4544677734375, -1.35772705078125, -1.260986328125, -1.16424560546875, -1.0675048828125, -0.97076416015625, -0.8740234375, -0.77728271484375, -0.6805419921875, -0.58380126953125, -0.487060546875, -0.39031982421875, -0.2935791015625, -0.19683837890625, -0.10009765625, -0.00335693359375, 0.0933837890625, 0.19012451171875, 0.286865234375, 0.38360595703125, 0.4803466796875, 0.57708740234375, 0.673828125, 0.77056884765625, 0.8673095703125, 0.96405029296875, 1.060791015625, 1.15753173828125, 1.2542724609375, 1.35101318359375, 1.44775390625, 1.54449462890625, 1.6412353515625, 1.73797607421875, 1.834716796875, 1.93145751953125, 2.0281982421875, 2.12493896484375, 2.2216796875, 2.31842041015625, 2.4151611328125, 2.51190185546875, 2.608642578125, 2.70538330078125, 2.8021240234375, 2.89886474609375, 2.99560546875, 3.09234619140625, 3.1890869140625, 3.28582763671875, 3.382568359375, 3.47930908203125, 3.5760498046875, 3.67279052734375, 3.76953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 13.0, 21.0, 14.0, 28.0, 35.0, 55.0, 78.0, 127.0, 178.0, 262.0, 431.0, 740.0, 1506.0, 3551.0, 11711.0, 64129.0, 667702.0, 2978303.0, 404985.0, 44913.0, 9234.0, 2946.0, 1373.0, 710.0, 418.0, 256.0, 172.0, 122.0, 72.0, 54.0, 40.0, 31.0, 24.0, 19.0, 12.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.166015625, -3.058349609375, -2.95068359375, -2.843017578125, -2.7353515625, -2.627685546875, -2.52001953125, -2.412353515625, -2.3046875, -2.197021484375, -2.08935546875, -1.981689453125, -1.8740234375, -1.766357421875, -1.65869140625, -1.551025390625, -1.443359375, -1.335693359375, -1.22802734375, -1.120361328125, -1.0126953125, -0.905029296875, -0.79736328125, -0.689697265625, -0.58203125, -0.474365234375, -0.36669921875, -0.259033203125, -0.1513671875, -0.043701171875, 0.06396484375, 0.171630859375, 0.279296875, 0.386962890625, 0.49462890625, 0.602294921875, 0.7099609375, 0.817626953125, 0.92529296875, 1.032958984375, 1.140625, 1.248291015625, 1.35595703125, 1.463623046875, 1.5712890625, 1.678955078125, 1.78662109375, 1.894287109375, 2.001953125, 2.109619140625, 2.21728515625, 2.324951171875, 2.4326171875, 2.540283203125, 2.64794921875, 2.755615234375, 2.86328125, 2.970947265625, 3.07861328125, 3.186279296875, 3.2939453125, 3.401611328125, 3.50927734375, 3.616943359375, 3.724609375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 10.0, 7.0, 10.0, 16.0, 31.0, 15.0, 32.0, 58.0, 64.0, 91.0, 130.0, 191.0, 241.0, 354.0, 403.0, 471.0, 483.0, 425.0, 297.0, 219.0, 144.0, 106.0, 68.0, 57.0, 39.0, 22.0, 25.0, 18.0, 12.0, 11.0, 4.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2265625, -1.1948623657226562, -1.1631622314453125, -1.1314620971679688, -1.099761962890625, -1.0680618286132812, -1.0363616943359375, -1.0046615600585938, -0.97296142578125, -0.9412612915039062, -0.9095611572265625, -0.8778610229492188, -0.846160888671875, -0.8144607543945312, -0.7827606201171875, -0.7510604858398438, -0.7193603515625, -0.6876602172851562, -0.6559600830078125, -0.6242599487304688, -0.592559814453125, -0.5608596801757812, -0.5291595458984375, -0.49745941162109375, -0.46575927734375, -0.43405914306640625, -0.4023590087890625, -0.37065887451171875, -0.338958740234375, -0.30725860595703125, -0.2755584716796875, -0.24385833740234375, -0.212158203125, -0.18045806884765625, -0.1487579345703125, -0.11705780029296875, -0.085357666015625, -0.05365753173828125, -0.0219573974609375, 0.00974273681640625, 0.04144287109375, 0.07314300537109375, 0.1048431396484375, 0.13654327392578125, 0.168243408203125, 0.19994354248046875, 0.2316436767578125, 0.26334381103515625, 0.2950439453125, 0.32674407958984375, 0.3584442138671875, 0.39014434814453125, 0.421844482421875, 0.45354461669921875, 0.4852447509765625, 0.5169448852539062, 0.54864501953125, 0.5803451538085938, 0.6120452880859375, 0.6437454223632812, 0.675445556640625, 0.7071456909179688, 0.7388458251953125, 0.7705459594726562, 0.80224609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 10.0, 11.0, 32.0, 32.0, 41.0, 50.0, 66.0, 89.0, 99.0, 93.0, 107.0, 92.0, 73.0, 60.0, 44.0, 29.0, 27.0, 19.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.473639965057373, -5.331472873687744, -5.189305305480957, -5.047138214111328, -4.904971122741699, -4.76280403137207, -4.620636940002441, -4.478469371795654, -4.336302280426025, -4.1941351890563965, -4.051967620849609, -3.9098005294799805, -3.7676334381103516, -3.6254663467407227, -3.4832990169525146, -3.3411316871643066, -3.1989645957946777, -3.056797504425049, -2.914630174636841, -2.772462844848633, -2.630295753479004, -2.488128662109375, -2.345961332321167, -2.203794002532959, -2.06162691116333, -1.9194597005844116, -1.7772924900054932, -1.6351252794265747, -1.4929580688476562, -1.3507908582687378, -1.2086236476898193, -1.0664564371109009, -0.9242887496948242, -0.7821215391159058, -0.6399543285369873, -0.49778711795806885, -0.3556199073791504, -0.21345269680023193, -0.07128548622131348, 0.07088172435760498, 0.21304893493652344, 0.3552161455154419, 0.49738335609436035, 0.6395505666732788, 0.7817177772521973, 0.9238849878311157, 1.0660521984100342, 1.2082194089889526, 1.350386619567871, 1.4925538301467896, 1.634721040725708, 1.7768882513046265, 1.919055461883545, 2.061222553253174, 2.203389883041382, 2.34555721282959, 2.4877243041992188, 2.6298913955688477, 2.7720587253570557, 2.9142260551452637, 3.0563931465148926, 3.1985602378845215, 3.3407275676727295, 3.4828948974609375, 3.6250619888305664]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 12.0, 19.0, 16.0, 25.0, 15.0, 29.0, 27.0, 32.0, 38.0, 47.0, 41.0, 39.0, 39.0, 45.0, 42.0, 47.0, 64.0, 48.0, 51.0, 37.0, 31.0, 30.0, 35.0, 34.0, 34.0, 20.0, 12.0, 14.0, 14.0, 8.0, 9.0, 6.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9903507232666016, -1.9063572883605957, -1.8223639726638794, -1.7383705377578735, -1.6543771028518677, -1.5703837871551514, -1.4863903522491455, -1.4023969173431396, -1.3184034824371338, -1.234410047531128, -1.1504167318344116, -1.0664232969284058, -0.9824298620223999, -0.8984364867210388, -0.8144431114196777, -0.7304496765136719, -0.6464563608169556, -0.5624629855155945, -0.4784695506095886, -0.39447617530822754, -0.31048277020454407, -0.2264893651008606, -0.1424959897994995, -0.05850255489349365, 0.02549082040786743, 0.1094842180609703, 0.19347761571407318, 0.27747100591659546, 0.36146441102027893, 0.4454578161239624, 0.5294511914253235, 0.6134446263313293, 0.6974380016326904, 0.7814313769340515, 0.8654248118400574, 0.9494181871414185, 1.0334116220474243, 1.1174049377441406, 1.2013983726501465, 1.2853918075561523, 1.3693852424621582, 1.453378677368164, 1.5373719930648804, 1.6213654279708862, 1.705358862876892, 1.7893521785736084, 1.8733456134796143, 1.9573390483856201, 2.041332244873047, 2.1253256797790527, 2.2093191146850586, 2.2933125495910645, 2.377305746078491, 2.461299180984497, 2.545292615890503, 2.629286050796509, 2.7132794857025146, 2.7972729206085205, 2.8812663555145264, 2.965259552001953, 3.049252986907959, 3.133246421813965, 3.2172398567199707, 3.3012332916259766, 3.3852267265319824]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 14.0, 27.0, 33.0, 52.0, 96.0, 138.0, 268.0, 379.0, 919.0, 1972.0, 4871.0, 13039.0, 40157.0, 129187.0, 337371.0, 333228.0, 126188.0, 39141.0, 12931.0, 4717.0, 1906.0, 886.0, 414.0, 240.0, 132.0, 78.0, 56.0, 28.0, 32.0, 19.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5287551879882812, -0.5111236572265625, -0.49349212646484375, -0.475860595703125, -0.45822906494140625, -0.4405975341796875, -0.42296600341796875, -0.40533447265625, -0.38770294189453125, -0.3700714111328125, -0.35243988037109375, -0.334808349609375, -0.31717681884765625, -0.2995452880859375, -0.28191375732421875, -0.2642822265625, -0.24665069580078125, -0.2290191650390625, -0.21138763427734375, -0.193756103515625, -0.17612457275390625, -0.1584930419921875, -0.14086151123046875, -0.12322998046875, -0.10559844970703125, -0.0879669189453125, -0.07033538818359375, -0.052703857421875, -0.03507232666015625, -0.0174407958984375, 0.00019073486328125, 0.017822265625, 0.03545379638671875, 0.0530853271484375, 0.07071685791015625, 0.088348388671875, 0.10597991943359375, 0.1236114501953125, 0.14124298095703125, 0.15887451171875, 0.17650604248046875, 0.1941375732421875, 0.21176910400390625, 0.229400634765625, 0.24703216552734375, 0.2646636962890625, 0.28229522705078125, 0.2999267578125, 0.31755828857421875, 0.3351898193359375, 0.35282135009765625, 0.370452880859375, 0.38808441162109375, 0.4057159423828125, 0.42334747314453125, 0.44097900390625, 0.45861053466796875, 0.4762420654296875, 0.49387359619140625, 0.511505126953125, 0.5291366577148438, 0.5467681884765625, 0.5643997192382812, 0.58203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 6.0, 5.0, 11.0, 17.0, 18.0, 28.0, 20.0, 36.0, 43.0, 36.0, 42.0, 53.0, 71.0, 80.0, 61.0, 55.0, 48.0, 62.0, 53.0, 47.0, 48.0, 23.0, 36.0, 33.0, 19.0, 11.0, 7.0, 12.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.673248291015625, -1.59649658203125, -1.519744873046875, -1.4429931640625, -1.366241455078125, -1.28948974609375, -1.212738037109375, -1.135986328125, -1.059234619140625, -0.98248291015625, -0.905731201171875, -0.8289794921875, -0.752227783203125, -0.67547607421875, -0.598724365234375, -0.52197265625, -0.445220947265625, -0.36846923828125, -0.291717529296875, -0.2149658203125, -0.138214111328125, -0.06146240234375, 0.015289306640625, 0.092041015625, 0.168792724609375, 0.24554443359375, 0.322296142578125, 0.3990478515625, 0.475799560546875, 0.55255126953125, 0.629302978515625, 0.7060546875, 0.782806396484375, 0.85955810546875, 0.936309814453125, 1.0130615234375, 1.089813232421875, 1.16656494140625, 1.243316650390625, 1.320068359375, 1.396820068359375, 1.47357177734375, 1.550323486328125, 1.6270751953125, 1.703826904296875, 1.78057861328125, 1.857330322265625, 1.93408203125, 2.010833740234375, 2.08758544921875, 2.164337158203125, 2.2410888671875, 2.317840576171875, 2.39459228515625, 2.471343994140625, 2.548095703125, 2.624847412109375, 2.70159912109375, 2.778350830078125, 2.8551025390625, 2.931854248046875, 3.00860595703125, 3.085357666015625, 3.162109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 3.0, 12.0, 11.0, 14.0, 25.0, 34.0, 50.0, 85.0, 126.0, 196.0, 317.0, 491.0, 708.0, 1145.0, 1761.0, 2914.0, 4619.0, 7538.0, 11819.0, 19030.0, 29740.0, 46383.0, 71340.0, 105166.0, 141018.0, 157844.0, 141102.0, 105637.0, 72048.0, 46719.0, 29707.0, 18887.0, 12044.0, 7547.0, 4504.0, 2871.0, 1812.0, 1188.0, 748.0, 474.0, 315.0, 203.0, 112.0, 82.0, 60.0, 33.0, 29.0, 14.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1788330078125, -0.1727733612060547, -0.16671371459960938, -0.16065406799316406, -0.15459442138671875, -0.14853477478027344, -0.14247512817382812, -0.1364154815673828, -0.1303558349609375, -0.12429618835449219, -0.11823654174804688, -0.11217689514160156, -0.10611724853515625, -0.10005760192871094, -0.09399795532226562, -0.08793830871582031, -0.081878662109375, -0.07581901550292969, -0.06975936889648438, -0.06369972229003906, -0.05764007568359375, -0.05158042907714844, -0.045520782470703125, -0.03946113586425781, -0.0334014892578125, -0.027341842651367188, -0.021282196044921875, -0.015222549438476562, -0.00916290283203125, -0.0031032562255859375, 0.002956390380859375, 0.009016036987304688, 0.01507568359375, 0.021135330200195312, 0.027194976806640625, 0.03325462341308594, 0.03931427001953125, 0.04537391662597656, 0.051433563232421875, 0.05749320983886719, 0.0635528564453125, 0.06961250305175781, 0.07567214965820312, 0.08173179626464844, 0.08779144287109375, 0.09385108947753906, 0.09991073608398438, 0.10597038269042969, 0.112030029296875, 0.11808967590332031, 0.12414932250976562, 0.13020896911621094, 0.13626861572265625, 0.14232826232910156, 0.14838790893554688, 0.1544475555419922, 0.1605072021484375, 0.1665668487548828, 0.17262649536132812, 0.17868614196777344, 0.18474578857421875, 0.19080543518066406, 0.19686508178710938, 0.2029247283935547, 0.208984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 11.0, 16.0, 12.0, 12.0, 20.0, 29.0, 24.0, 20.0, 28.0, 27.0, 30.0, 46.0, 51.0, 44.0, 52.0, 61.0, 60.0, 43.0, 41.0, 40.0, 47.0, 38.0, 27.0, 25.0, 26.0, 22.0, 23.0, 18.0, 17.0, 12.0, 17.0, 15.0, 12.0, 10.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.164581298828125, -3.04986572265625, -2.935150146484375, -2.8204345703125, -2.705718994140625, -2.59100341796875, -2.476287841796875, -2.361572265625, -2.246856689453125, -2.13214111328125, -2.017425537109375, -1.9027099609375, -1.787994384765625, -1.67327880859375, -1.558563232421875, -1.44384765625, -1.329132080078125, -1.21441650390625, -1.099700927734375, -0.9849853515625, -0.870269775390625, -0.75555419921875, -0.640838623046875, -0.526123046875, -0.411407470703125, -0.29669189453125, -0.181976318359375, -0.0672607421875, 0.047454833984375, 0.16217041015625, 0.276885986328125, 0.3916015625, 0.506317138671875, 0.62103271484375, 0.735748291015625, 0.8504638671875, 0.965179443359375, 1.07989501953125, 1.194610595703125, 1.309326171875, 1.424041748046875, 1.53875732421875, 1.653472900390625, 1.7681884765625, 1.882904052734375, 1.99761962890625, 2.112335205078125, 2.22705078125, 2.341766357421875, 2.45648193359375, 2.571197509765625, 2.6859130859375, 2.800628662109375, 2.91534423828125, 3.030059814453125, 3.144775390625, 3.259490966796875, 3.37420654296875, 3.488922119140625, 3.6036376953125, 3.718353271484375, 3.83306884765625, 3.947784423828125, 4.0625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 14.0, 12.0, 18.0, 29.0, 37.0, 57.0, 86.0, 113.0, 210.0, 304.0, 524.0, 1009.0, 2084.0, 5286.0, 17541.0, 70156.0, 275778.0, 444150.0, 171466.0, 41214.0, 11092.0, 3845.0, 1617.0, 773.0, 390.0, 243.0, 156.0, 103.0, 66.0, 46.0, 34.0, 21.0, 21.0, 12.0, 5.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048797607421875, -0.04694318771362305, -0.045088768005371094, -0.04323434829711914, -0.04137992858886719, -0.039525508880615234, -0.03767108917236328, -0.03581666946411133, -0.033962249755859375, -0.03210783004760742, -0.03025341033935547, -0.028398990631103516, -0.026544570922851562, -0.02469015121459961, -0.022835731506347656, -0.020981311798095703, -0.01912689208984375, -0.017272472381591797, -0.015418052673339844, -0.01356363296508789, -0.011709213256835938, -0.009854793548583984, -0.008000373840332031, -0.006145954132080078, -0.004291534423828125, -0.002437114715576172, -0.0005826950073242188, 0.0012717247009277344, 0.0031261444091796875, 0.004980564117431641, 0.006834983825683594, 0.008689403533935547, 0.0105438232421875, 0.012398242950439453, 0.014252662658691406, 0.01610708236694336, 0.017961502075195312, 0.019815921783447266, 0.02167034149169922, 0.023524761199951172, 0.025379180908203125, 0.027233600616455078, 0.02908802032470703, 0.030942440032958984, 0.03279685974121094, 0.03465127944946289, 0.036505699157714844, 0.0383601188659668, 0.04021453857421875, 0.0420689582824707, 0.043923377990722656, 0.04577779769897461, 0.04763221740722656, 0.049486637115478516, 0.05134105682373047, 0.05319547653198242, 0.055049896240234375, 0.05690431594848633, 0.05875873565673828, 0.060613155364990234, 0.06246757507324219, 0.06432199478149414, 0.0661764144897461, 0.06803083419799805, 0.06988525390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 12.0, 7.0, 29.0, 46.0, 68.0, 115.0, 126.0, 138.0, 150.0, 125.0, 77.0, 34.0, 32.0, 18.0, 13.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8995018005371094e-05, -4.674401134252548e-05, -4.449300467967987e-05, -4.224199801683426e-05, -3.999099135398865e-05, -3.7739984691143036e-05, -3.5488978028297424e-05, -3.323797136545181e-05, -3.09869647026062e-05, -2.873595803976059e-05, -2.6484951376914978e-05, -2.4233944714069366e-05, -2.1982938051223755e-05, -1.9731931388378143e-05, -1.7480924725532532e-05, -1.522991806268692e-05, -1.2978911399841309e-05, -1.0727904736995697e-05, -8.476898074150085e-06, -6.225891411304474e-06, -3.974884748458862e-06, -1.7238780856132507e-06, 5.271285772323608e-07, 2.7781352400779724e-06, 5.029141902923584e-06, 7.2801485657691956e-06, 9.531155228614807e-06, 1.1782161891460419e-05, 1.403316855430603e-05, 1.6284175217151642e-05, 1.8535181879997253e-05, 2.0786188542842865e-05, 2.3037195205688477e-05, 2.5288201868534088e-05, 2.75392085313797e-05, 2.979021519422531e-05, 3.204122185707092e-05, 3.4292228519916534e-05, 3.6543235182762146e-05, 3.879424184560776e-05, 4.104524850845337e-05, 4.329625517129898e-05, 4.554726183414459e-05, 4.7798268496990204e-05, 5.0049275159835815e-05, 5.230028182268143e-05, 5.455128848552704e-05, 5.680229514837265e-05, 5.905330181121826e-05, 6.130430847406387e-05, 6.355531513690948e-05, 6.58063217997551e-05, 6.805732846260071e-05, 7.030833512544632e-05, 7.255934178829193e-05, 7.481034845113754e-05, 7.706135511398315e-05, 7.931236177682877e-05, 8.156336843967438e-05, 8.381437510251999e-05, 8.60653817653656e-05, 8.831638842821121e-05, 9.056739509105682e-05, 9.281840175390244e-05, 9.506940841674805e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 4.0, 17.0, 22.0, 30.0, 41.0, 42.0, 68.0, 105.0, 174.0, 314.0, 556.0, 1181.0, 2614.0, 6800.0, 18623.0, 54137.0, 159157.0, 345160.0, 287296.0, 112392.0, 37786.0, 13044.0, 4932.0, 2005.0, 917.0, 437.0, 250.0, 133.0, 97.0, 49.0, 39.0, 33.0, 18.0, 18.0, 12.0, 5.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.045928955078125, -0.0445713996887207, -0.043213844299316406, -0.04185628890991211, -0.04049873352050781, -0.039141178131103516, -0.03778362274169922, -0.03642606735229492, -0.035068511962890625, -0.03371095657348633, -0.03235340118408203, -0.030995845794677734, -0.029638290405273438, -0.02828073501586914, -0.026923179626464844, -0.025565624237060547, -0.02420806884765625, -0.022850513458251953, -0.021492958068847656, -0.02013540267944336, -0.018777847290039062, -0.017420291900634766, -0.01606273651123047, -0.014705181121826172, -0.013347625732421875, -0.011990070343017578, -0.010632514953613281, -0.009274959564208984, -0.007917404174804688, -0.006559848785400391, -0.005202293395996094, -0.003844738006591797, -0.0024871826171875, -0.0011296272277832031, 0.00022792816162109375, 0.0015854835510253906, 0.0029430389404296875, 0.004300594329833984, 0.005658149719238281, 0.007015705108642578, 0.008373260498046875, 0.009730815887451172, 0.011088371276855469, 0.012445926666259766, 0.013803482055664062, 0.01516103744506836, 0.016518592834472656, 0.017876148223876953, 0.01923370361328125, 0.020591259002685547, 0.021948814392089844, 0.02330636978149414, 0.024663925170898438, 0.026021480560302734, 0.02737903594970703, 0.028736591339111328, 0.030094146728515625, 0.03145170211791992, 0.03280925750732422, 0.034166812896728516, 0.03552436828613281, 0.03688192367553711, 0.038239479064941406, 0.0395970344543457, 0.04095458984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 6.0, 4.0, 12.0, 12.0, 19.0, 26.0, 26.0, 26.0, 36.0, 43.0, 55.0, 59.0, 56.0, 65.0, 70.0, 70.0, 60.0, 63.0, 50.0, 43.0, 42.0, 26.0, 25.0, 12.0, 16.0, 10.0, 10.0, 13.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-0.0199432373046875, -0.01945960521697998, -0.01897597312927246, -0.01849234104156494, -0.018008708953857422, -0.017525076866149902, -0.017041444778442383, -0.016557812690734863, -0.016074180603027344, -0.015590548515319824, -0.015106916427612305, -0.014623284339904785, -0.014139652252197266, -0.013656020164489746, -0.013172388076782227, -0.012688755989074707, -0.012205123901367188, -0.011721491813659668, -0.011237859725952148, -0.010754227638244629, -0.01027059555053711, -0.00978696346282959, -0.00930333137512207, -0.00881969928741455, -0.008336067199707031, -0.007852435111999512, -0.007368803024291992, -0.006885170936584473, -0.006401538848876953, -0.005917906761169434, -0.005434274673461914, -0.0049506425857543945, -0.004467010498046875, -0.0039833784103393555, -0.003499746322631836, -0.0030161142349243164, -0.002532482147216797, -0.0020488500595092773, -0.0015652179718017578, -0.0010815858840942383, -0.0005979537963867188, -0.00011432170867919922, 0.0003693103790283203, 0.0008529424667358398, 0.0013365745544433594, 0.001820206642150879, 0.0023038387298583984, 0.002787470817565918, 0.0032711029052734375, 0.003754734992980957, 0.0042383670806884766, 0.004721999168395996, 0.005205631256103516, 0.005689263343811035, 0.006172895431518555, 0.006656527519226074, 0.007140159606933594, 0.007623791694641113, 0.008107423782348633, 0.008591055870056152, 0.009074687957763672, 0.009558320045471191, 0.010041952133178711, 0.01052558422088623, 0.01100921630859375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 41.0, 97.0, 197.0, 254.0, 221.0, 121.0, 44.0, 15.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.412555694580078, -9.185964584350586, -8.95937442779541, -8.732783317565918, -8.506192207336426, -8.279601097106934, -8.053010940551758, -7.826419830322266, -7.599828720092773, -7.3732380867004395, -7.146646976470947, -6.920056343078613, -6.693465232849121, -6.466874599456787, -6.240283966064453, -6.013692855834961, -5.787102222442627, -5.560511589050293, -5.333920478820801, -5.107329845428467, -4.880738735198975, -4.654148101806641, -4.427556991577148, -4.2009663581848145, -3.9743754863739014, -3.7477846145629883, -3.521193742752075, -3.294602870941162, -3.068012237548828, -2.841421127319336, -2.614830493927002, -2.388239622116089, -2.161648750305176, -1.9350578784942627, -1.7084670066833496, -1.481876254081726, -1.255285382270813, -1.0286945104599, -0.8021037578582764, -0.5755128860473633, -0.3489220142364502, -0.1223311722278595, 0.1042596697807312, 0.3308504819869995, 0.5574413537979126, 0.7840322256088257, 1.0106229782104492, 1.2372138500213623, 1.4638047218322754, 1.6903955936431885, 1.9169864654541016, 2.1435770988464355, 2.3701682090759277, 2.5967588424682617, 2.823349714279175, 3.049940586090088, 3.276531457901001, 3.503122329711914, 3.729713201522827, 3.9563040733337402, 4.182894706726074, 4.409485816955566, 4.6360764503479, 4.862667083740234, 5.089258193969727]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 11.0, 20.0, 24.0, 22.0, 34.0, 30.0, 38.0, 52.0, 50.0, 53.0, 48.0, 47.0, 59.0, 72.0, 53.0, 59.0, 45.0, 40.0, 38.0, 39.0, 31.0, 24.0, 22.0, 14.0, 13.0, 10.0, 7.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5494000911712646, -1.480488896369934, -1.4115777015686035, -1.342666506767273, -1.2737553119659424, -1.2048442363739014, -1.1359330415725708, -1.0670218467712402, -0.9981106519699097, -0.9291994571685791, -0.8602882623672485, -0.7913771271705627, -0.7224659323692322, -0.6535547375679016, -0.5846436023712158, -0.5157324075698853, -0.4468212127685547, -0.3779100179672241, -0.30899885296821594, -0.24008767306804657, -0.1711764931678772, -0.10226529836654663, -0.03335413336753845, 0.03555703163146973, 0.10446822643280029, 0.17337940633296967, 0.24229058623313904, 0.3112017512321472, 0.3801129460334778, 0.44902414083480835, 0.5179352760314941, 0.5868464708328247, 0.6557574272155762, 0.7246686220169067, 0.7935798168182373, 0.8624909520149231, 0.9314021468162537, 1.0003132820129395, 1.06922447681427, 1.1381356716156006, 1.2070468664169312, 1.2759580612182617, 1.3448692560195923, 1.4137804508209229, 1.4826915264129639, 1.551602840423584, 1.620513916015625, 1.6894251108169556, 1.7583363056182861, 1.8272475004196167, 1.8961586952209473, 1.9650698900222778, 2.0339810848236084, 2.1028921604156494, 2.1718034744262695, 2.2407145500183105, 2.3096256256103516, 2.3785367012023926, 2.4474480152130127, 2.5163590908050537, 2.585270404815674, 2.654181480407715, 2.723092794418335, 2.792003870010376, 2.860915184020996]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 14.0, 19.0, 43.0, 64.0, 107.0, 203.0, 438.0, 901.0, 2148.0, 4915.0, 13911.0, 45578.0, 179110.0, 519140.0, 205393.0, 51631.0, 15369.0, 5471.0, 2137.0, 974.0, 444.0, 219.0, 127.0, 74.0, 36.0, 14.0, 19.0, 13.0, 10.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.311981201171875, -2.24505615234375, -2.178131103515625, -2.1112060546875, -2.044281005859375, -1.97735595703125, -1.910430908203125, -1.843505859375, -1.776580810546875, -1.70965576171875, -1.642730712890625, -1.5758056640625, -1.508880615234375, -1.44195556640625, -1.375030517578125, -1.30810546875, -1.241180419921875, -1.17425537109375, -1.107330322265625, -1.0404052734375, -0.973480224609375, -0.90655517578125, -0.839630126953125, -0.772705078125, -0.705780029296875, -0.63885498046875, -0.571929931640625, -0.5050048828125, -0.438079833984375, -0.37115478515625, -0.304229736328125, -0.2373046875, -0.170379638671875, -0.10345458984375, -0.036529541015625, 0.0303955078125, 0.097320556640625, 0.16424560546875, 0.231170654296875, 0.298095703125, 0.365020751953125, 0.43194580078125, 0.498870849609375, 0.5657958984375, 0.632720947265625, 0.69964599609375, 0.766571044921875, 0.83349609375, 0.900421142578125, 0.96734619140625, 1.034271240234375, 1.1011962890625, 1.168121337890625, 1.23504638671875, 1.301971435546875, 1.368896484375, 1.435821533203125, 1.50274658203125, 1.569671630859375, 1.6365966796875, 1.703521728515625, 1.77044677734375, 1.837371826171875, 1.904296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 7.0, 5.0, 6.0, 14.0, 16.0, 12.0, 23.0, 22.0, 41.0, 30.0, 49.0, 50.0, 52.0, 48.0, 52.0, 50.0, 66.0, 69.0, 48.0, 52.0, 39.0, 42.0, 42.0, 21.0, 25.0, 18.0, 25.0, 13.0, 17.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.389129638671875, -3.26458740234375, -3.140045166015625, -3.0155029296875, -2.890960693359375, -2.76641845703125, -2.641876220703125, -2.517333984375, -2.392791748046875, -2.26824951171875, -2.143707275390625, -2.0191650390625, -1.894622802734375, -1.77008056640625, -1.645538330078125, -1.52099609375, -1.396453857421875, -1.27191162109375, -1.147369384765625, -1.0228271484375, -0.898284912109375, -0.77374267578125, -0.649200439453125, -0.524658203125, -0.400115966796875, -0.27557373046875, -0.151031494140625, -0.0264892578125, 0.098052978515625, 0.22259521484375, 0.347137451171875, 0.4716796875, 0.596221923828125, 0.72076416015625, 0.845306396484375, 0.9698486328125, 1.094390869140625, 1.21893310546875, 1.343475341796875, 1.468017578125, 1.592559814453125, 1.71710205078125, 1.841644287109375, 1.9661865234375, 2.090728759765625, 2.21527099609375, 2.339813232421875, 2.46435546875, 2.588897705078125, 2.71343994140625, 2.837982177734375, 2.9625244140625, 3.087066650390625, 3.21160888671875, 3.336151123046875, 3.460693359375, 3.585235595703125, 3.70977783203125, 3.834320068359375, 3.9588623046875, 4.083404541015625, 4.20794677734375, 4.332489013671875, 4.45703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 17.0, 21.0, 32.0, 39.0, 84.0, 108.0, 155.0, 237.0, 555.0, 3187.0, 217870.0, 816914.0, 7771.0, 798.0, 253.0, 190.0, 116.0, 72.0, 43.0, 34.0, 22.0, 9.0, 8.0, 8.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3125, -10.06781005859375, -9.8231201171875, -9.57843017578125, -9.333740234375, -9.08905029296875, -8.8443603515625, -8.59967041015625, -8.35498046875, -8.11029052734375, -7.8656005859375, -7.62091064453125, -7.376220703125, -7.13153076171875, -6.8868408203125, -6.64215087890625, -6.3974609375, -6.15277099609375, -5.9080810546875, -5.66339111328125, -5.418701171875, -5.17401123046875, -4.9293212890625, -4.68463134765625, -4.43994140625, -4.19525146484375, -3.9505615234375, -3.70587158203125, -3.461181640625, -3.21649169921875, -2.9718017578125, -2.72711181640625, -2.482421875, -2.23773193359375, -1.9930419921875, -1.74835205078125, -1.503662109375, -1.25897216796875, -1.0142822265625, -0.76959228515625, -0.52490234375, -0.28021240234375, -0.0355224609375, 0.20916748046875, 0.453857421875, 0.69854736328125, 0.9432373046875, 1.18792724609375, 1.4326171875, 1.67730712890625, 1.9219970703125, 2.16668701171875, 2.411376953125, 2.65606689453125, 2.9007568359375, 3.14544677734375, 3.39013671875, 3.63482666015625, 3.8795166015625, 4.12420654296875, 4.368896484375, 4.61358642578125, 4.8582763671875, 5.10296630859375, 5.34765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 12.0, 5.0, 6.0, 8.0, 7.0, 16.0, 12.0, 29.0, 29.0, 19.0, 24.0, 40.0, 41.0, 49.0, 44.0, 37.0, 56.0, 66.0, 48.0, 42.0, 50.0, 57.0, 37.0, 37.0, 44.0, 29.0, 30.0, 29.0, 26.0, 20.0, 13.0, 10.0, 13.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01171875, -4.86651611328125, -4.7213134765625, -4.57611083984375, -4.430908203125, -4.28570556640625, -4.1405029296875, -3.99530029296875, -3.85009765625, -3.70489501953125, -3.5596923828125, -3.41448974609375, -3.269287109375, -3.12408447265625, -2.9788818359375, -2.83367919921875, -2.6884765625, -2.54327392578125, -2.3980712890625, -2.25286865234375, -2.107666015625, -1.96246337890625, -1.8172607421875, -1.67205810546875, -1.52685546875, -1.38165283203125, -1.2364501953125, -1.09124755859375, -0.946044921875, -0.80084228515625, -0.6556396484375, -0.51043701171875, -0.365234375, -0.22003173828125, -0.0748291015625, 0.07037353515625, 0.215576171875, 0.36077880859375, 0.5059814453125, 0.65118408203125, 0.79638671875, 0.94158935546875, 1.0867919921875, 1.23199462890625, 1.377197265625, 1.52239990234375, 1.6676025390625, 1.81280517578125, 1.9580078125, 2.10321044921875, 2.2484130859375, 2.39361572265625, 2.538818359375, 2.68402099609375, 2.8292236328125, 2.97442626953125, 3.11962890625, 3.26483154296875, 3.4100341796875, 3.55523681640625, 3.700439453125, 3.84564208984375, 3.9908447265625, 4.13604736328125, 4.28125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 9.0, 9.0, 18.0, 31.0, 45.0, 80.0, 187.0, 397.0, 1134.0, 3920.0, 23560.0, 897257.0, 112314.0, 6647.0, 1795.0, 585.0, 254.0, 101.0, 58.0, 36.0, 24.0, 14.0, 11.0, 4.0, 8.0, 5.0, 4.0, 2.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.537109375, -2.459503173828125, -2.38189697265625, -2.304290771484375, -2.2266845703125, -2.149078369140625, -2.07147216796875, -1.993865966796875, -1.916259765625, -1.838653564453125, -1.76104736328125, -1.683441162109375, -1.6058349609375, -1.528228759765625, -1.45062255859375, -1.373016357421875, -1.29541015625, -1.217803955078125, -1.14019775390625, -1.062591552734375, -0.9849853515625, -0.907379150390625, -0.82977294921875, -0.752166748046875, -0.674560546875, -0.596954345703125, -0.51934814453125, -0.441741943359375, -0.3641357421875, -0.286529541015625, -0.20892333984375, -0.131317138671875, -0.0537109375, 0.023895263671875, 0.10150146484375, 0.179107666015625, 0.2567138671875, 0.334320068359375, 0.41192626953125, 0.489532470703125, 0.567138671875, 0.644744873046875, 0.72235107421875, 0.799957275390625, 0.8775634765625, 0.955169677734375, 1.03277587890625, 1.110382080078125, 1.18798828125, 1.265594482421875, 1.34320068359375, 1.420806884765625, 1.4984130859375, 1.576019287109375, 1.65362548828125, 1.731231689453125, 1.808837890625, 1.886444091796875, 1.96405029296875, 2.041656494140625, 2.1192626953125, 2.196868896484375, 2.27447509765625, 2.352081298828125, 2.4296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 26.0, 39.0, 73.0, 171.0, 334.0, 177.0, 95.0, 45.0, 17.0, 10.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0006976127624511719, -0.000683516263961792, -0.0006694197654724121, -0.0006553232669830322, -0.0006412267684936523, -0.0006271302700042725, -0.0006130337715148926, -0.0005989372730255127, -0.0005848407745361328, -0.0005707442760467529, -0.000556647777557373, -0.0005425512790679932, -0.0005284547805786133, -0.0005143582820892334, -0.0005002617835998535, -0.00048616528511047363, -0.00047206878662109375, -0.00045797228813171387, -0.000443875789642334, -0.0004297792911529541, -0.0004156827926635742, -0.00040158629417419434, -0.00038748979568481445, -0.00037339329719543457, -0.0003592967987060547, -0.0003452003002166748, -0.0003311038017272949, -0.00031700730323791504, -0.00030291080474853516, -0.0002888143062591553, -0.0002747178077697754, -0.0002606213092803955, -0.0002465248107910156, -0.00023242831230163574, -0.00021833181381225586, -0.00020423531532287598, -0.0001901388168334961, -0.0001760423183441162, -0.00016194581985473633, -0.00014784932136535645, -0.00013375282287597656, -0.00011965632438659668, -0.0001055598258972168, -9.146332740783691e-05, -7.736682891845703e-05, -6.327033042907715e-05, -4.9173831939697266e-05, -3.507733345031738e-05, -2.09808349609375e-05, -6.884336471557617e-06, 7.212162017822266e-06, 2.130866050720215e-05, 3.540515899658203e-05, 4.9501657485961914e-05, 6.35981559753418e-05, 7.769465446472168e-05, 9.179115295410156e-05, 0.00010588765144348145, 0.00011998414993286133, 0.0001340806484222412, 0.0001481771469116211, 0.00016227364540100098, 0.00017637014389038086, 0.00019046664237976074, 0.00020456314086914062]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 5.0, 12.0, 29.0, 60.0, 94.0, 166.0, 402.0, 1000.0, 4329.0, 64989.0, 941860.0, 30881.0, 3203.0, 779.0, 336.0, 162.0, 92.0, 41.0, 19.0, 17.0, 12.0, 10.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.320343017578125, -2.23248291015625, -2.144622802734375, -2.0567626953125, -1.968902587890625, -1.88104248046875, -1.793182373046875, -1.705322265625, -1.617462158203125, -1.52960205078125, -1.441741943359375, -1.3538818359375, -1.266021728515625, -1.17816162109375, -1.090301513671875, -1.00244140625, -0.914581298828125, -0.82672119140625, -0.738861083984375, -0.6510009765625, -0.563140869140625, -0.47528076171875, -0.387420654296875, -0.299560546875, -0.211700439453125, -0.12384033203125, -0.035980224609375, 0.0518798828125, 0.139739990234375, 0.22760009765625, 0.315460205078125, 0.4033203125, 0.491180419921875, 0.57904052734375, 0.666900634765625, 0.7547607421875, 0.842620849609375, 0.93048095703125, 1.018341064453125, 1.106201171875, 1.194061279296875, 1.28192138671875, 1.369781494140625, 1.4576416015625, 1.545501708984375, 1.63336181640625, 1.721221923828125, 1.80908203125, 1.896942138671875, 1.98480224609375, 2.072662353515625, 2.1605224609375, 2.248382568359375, 2.33624267578125, 2.424102783203125, 2.511962890625, 2.599822998046875, 2.68768310546875, 2.775543212890625, 2.8634033203125, 2.951263427734375, 3.03912353515625, 3.126983642578125, 3.21484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 2.0, 12.0, 10.0, 10.0, 15.0, 19.0, 28.0, 46.0, 48.0, 76.0, 87.0, 117.0, 108.0, 74.0, 69.0, 62.0, 48.0, 39.0, 23.0, 21.0, 11.0, 15.0, 7.0, 6.0, 4.0, 0.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.37353515625, -0.3606605529785156, -0.34778594970703125, -0.3349113464355469, -0.3220367431640625, -0.3091621398925781, -0.29628753662109375, -0.2834129333496094, -0.270538330078125, -0.2576637268066406, -0.24478912353515625, -0.23191452026367188, -0.2190399169921875, -0.20616531372070312, -0.19329071044921875, -0.18041610717773438, -0.16754150390625, -0.15466690063476562, -0.14179229736328125, -0.12891769409179688, -0.1160430908203125, -0.10316848754882812, -0.09029388427734375, -0.07741928100585938, -0.064544677734375, -0.051670074462890625, -0.03879547119140625, -0.025920867919921875, -0.0130462646484375, -0.000171661376953125, 0.01270294189453125, 0.025577545166015625, 0.0384521484375, 0.051326751708984375, 0.06420135498046875, 0.07707595825195312, 0.0899505615234375, 0.10282516479492188, 0.11569976806640625, 0.12857437133789062, 0.141448974609375, 0.15432357788085938, 0.16719818115234375, 0.18007278442382812, 0.1929473876953125, 0.20582199096679688, 0.21869659423828125, 0.23157119750976562, 0.24444580078125, 0.2573204040527344, 0.27019500732421875, 0.2830696105957031, 0.2959442138671875, 0.3088188171386719, 0.32169342041015625, 0.3345680236816406, 0.347442626953125, 0.3603172302246094, 0.37319183349609375, 0.3860664367675781, 0.3989410400390625, 0.4118156433105469, 0.42469024658203125, 0.4375648498535156, 0.450439453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 11.0, 13.0, 46.0, 69.0, 111.0, 161.0, 150.0, 176.0, 114.0, 66.0, 51.0, 13.0, 11.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.608284950256348, -8.32614803314209, -8.044010162353516, -7.7618727684021, -7.479735374450684, -7.197598457336426, -6.91546106338501, -6.633323669433594, -6.351186275482178, -6.069048881530762, -5.786911487579346, -5.50477409362793, -5.222637176513672, -4.940499305725098, -4.65836238861084, -4.376224994659424, -4.094087600708008, -3.811950206756592, -3.529812812805176, -3.247675657272339, -2.965538263320923, -2.683400869369507, -2.40126371383667, -2.119126319885254, -1.836988925933838, -1.5548515319824219, -1.2727142572402954, -0.9905769228935242, -0.7084395885467529, -0.4263021945953369, -0.14416491985321045, 0.13797235488891602, 0.4201087951660156, 0.7022461295127869, 0.9843834638595581, 1.2665207386016846, 1.5486581325531006, 1.8307955265045166, 2.1129326820373535, 2.3950700759887695, 2.6772074699401855, 2.9593448638916016, 3.2414822578430176, 3.5236194133758545, 3.8057568073272705, 4.087894439697266, 4.370031356811523, 4.6521687507629395, 4.9343061447143555, 5.2164435386657715, 5.4985809326171875, 5.7807183265686035, 6.0628557205200195, 6.344992637634277, 6.627130031585693, 6.909267425537109, 7.191404819488525, 7.473542213439941, 7.755679607391357, 8.037817001342773, 8.319953918457031, 8.602091789245605, 8.884228706359863, 9.166366577148438, 9.448503494262695]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 7.0, 13.0, 16.0, 11.0, 18.0, 16.0, 20.0, 30.0, 29.0, 28.0, 28.0, 26.0, 38.0, 44.0, 44.0, 37.0, 32.0, 46.0, 32.0, 46.0, 43.0, 33.0, 46.0, 38.0, 43.0, 34.0, 30.0, 23.0, 28.0, 16.0, 12.0, 21.0, 10.0, 13.0, 10.0, 6.0, 6.0, 4.0, 4.0, 8.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.823061943054199, -5.629883289337158, -5.436705112457275, -5.243526458740234, -5.050347805023193, -4.857169151306152, -4.6639909744262695, -4.4708123207092285, -4.2776336669921875, -4.0844550132751465, -3.8912765979766846, -3.6980981826782227, -3.5049195289611816, -3.3117411136627197, -3.118562698364258, -2.925384044647217, -2.732205629348755, -2.539027214050293, -2.345848560333252, -2.15267014503479, -1.959491491317749, -1.766313076019287, -1.5731345415115356, -1.3799560070037842, -1.1867774724960327, -0.9935989379882812, -0.8004204034805298, -0.6072419285774231, -0.41406339406967163, -0.22088485956192017, -0.027706384658813477, 0.165472149848938, 0.35865068435668945, 0.5518292188644409, 0.7450077533721924, 0.9381862282752991, 1.1313648223876953, 1.3245432376861572, 1.5177217721939087, 1.7109003067016602, 1.9040788412094116, 2.097257375717163, 2.290435791015625, 2.483614444732666, 2.676792860031128, 2.869971513748169, 3.063149929046631, 3.256328582763672, 3.449506998062134, 3.6426854133605957, 3.8358640670776367, 4.029042720794678, 4.2222208976745605, 4.415399551391602, 4.608578205108643, 4.801756858825684, 4.994935035705566, 5.188113689422607, 5.38129186630249, 5.574470520019531, 5.767649173736572, 5.960827827453613, 6.154006004333496, 6.347184658050537, 6.540363311767578]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 13.0, 21.0, 30.0, 41.0, 67.0, 109.0, 186.0, 267.0, 505.0, 950.0, 2857.0, 25749.0, 1092606.0, 2979991.0, 83981.0, 4663.0, 1034.0, 437.0, 252.0, 165.0, 113.0, 73.0, 47.0, 33.0, 22.0, 23.0, 15.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.98046875, -6.7762451171875, -6.572021484375, -6.3677978515625, -6.16357421875, -5.9593505859375, -5.755126953125, -5.5509033203125, -5.3466796875, -5.1424560546875, -4.938232421875, -4.7340087890625, -4.52978515625, -4.3255615234375, -4.121337890625, -3.9171142578125, -3.712890625, -3.5086669921875, -3.304443359375, -3.1002197265625, -2.89599609375, -2.6917724609375, -2.487548828125, -2.2833251953125, -2.0791015625, -1.8748779296875, -1.670654296875, -1.4664306640625, -1.26220703125, -1.0579833984375, -0.853759765625, -0.6495361328125, -0.4453125, -0.2410888671875, -0.036865234375, 0.1673583984375, 0.37158203125, 0.5758056640625, 0.780029296875, 0.9842529296875, 1.1884765625, 1.3927001953125, 1.596923828125, 1.8011474609375, 2.00537109375, 2.2095947265625, 2.413818359375, 2.6180419921875, 2.822265625, 3.0264892578125, 3.230712890625, 3.4349365234375, 3.63916015625, 3.8433837890625, 4.047607421875, 4.2518310546875, 4.4560546875, 4.6602783203125, 4.864501953125, 5.0687255859375, 5.27294921875, 5.4771728515625, 5.681396484375, 5.8856201171875, 6.08984375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 20.0, 19.0, 22.0, 25.0, 41.0, 42.0, 50.0, 58.0, 54.0, 73.0, 74.0, 73.0, 70.0, 69.0, 61.0, 51.0, 49.0, 44.0, 24.0, 17.0, 15.0, 7.0, 8.0, 9.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.8138427734375, -1.717529296875, -1.6212158203125, -1.52490234375, -1.4285888671875, -1.332275390625, -1.2359619140625, -1.1396484375, -1.0433349609375, -0.947021484375, -0.8507080078125, -0.75439453125, -0.6580810546875, -0.561767578125, -0.4654541015625, -0.369140625, -0.2728271484375, -0.176513671875, -0.0802001953125, 0.01611328125, 0.1124267578125, 0.208740234375, 0.3050537109375, 0.4013671875, 0.4976806640625, 0.593994140625, 0.6903076171875, 0.78662109375, 0.8829345703125, 0.979248046875, 1.0755615234375, 1.171875, 1.2681884765625, 1.364501953125, 1.4608154296875, 1.55712890625, 1.6534423828125, 1.749755859375, 1.8460693359375, 1.9423828125, 2.0386962890625, 2.135009765625, 2.2313232421875, 2.32763671875, 2.4239501953125, 2.520263671875, 2.6165771484375, 2.712890625, 2.8092041015625, 2.905517578125, 3.0018310546875, 3.09814453125, 3.1944580078125, 3.290771484375, 3.3870849609375, 3.4833984375, 3.5797119140625, 3.676025390625, 3.7723388671875, 3.86865234375, 3.9649658203125, 4.061279296875, 4.1575927734375, 4.25390625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 9.0, 17.0, 10.0, 26.0, 42.0, 66.0, 104.0, 176.0, 332.0, 636.0, 1563.0, 4192.0, 18862.0, 257975.0, 3484585.0, 392401.0, 24794.0, 5067.0, 1736.0, 798.0, 349.0, 198.0, 116.0, 68.0, 38.0, 35.0, 17.0, 16.0, 15.0, 12.0, 5.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.832916259765625, -2.69512939453125, -2.557342529296875, -2.4195556640625, -2.281768798828125, -2.14398193359375, -2.006195068359375, -1.868408203125, -1.730621337890625, -1.59283447265625, -1.455047607421875, -1.3172607421875, -1.179473876953125, -1.04168701171875, -0.903900146484375, -0.76611328125, -0.628326416015625, -0.49053955078125, -0.352752685546875, -0.2149658203125, -0.077178955078125, 0.06060791015625, 0.198394775390625, 0.336181640625, 0.473968505859375, 0.61175537109375, 0.749542236328125, 0.8873291015625, 1.025115966796875, 1.16290283203125, 1.300689697265625, 1.4384765625, 1.576263427734375, 1.71405029296875, 1.851837158203125, 1.9896240234375, 2.127410888671875, 2.26519775390625, 2.402984619140625, 2.540771484375, 2.678558349609375, 2.81634521484375, 2.954132080078125, 3.0919189453125, 3.229705810546875, 3.36749267578125, 3.505279541015625, 3.64306640625, 3.780853271484375, 3.91864013671875, 4.056427001953125, 4.1942138671875, 4.332000732421875, 4.46978759765625, 4.607574462890625, 4.745361328125, 4.883148193359375, 5.02093505859375, 5.158721923828125, 5.2965087890625, 5.434295654296875, 5.57208251953125, 5.709869384765625, 5.84765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 4.0, 9.0, 16.0, 15.0, 33.0, 41.0, 63.0, 88.0, 122.0, 174.0, 255.0, 353.0, 465.0, 504.0, 504.0, 464.0, 296.0, 203.0, 133.0, 95.0, 63.0, 48.0, 35.0, 20.0, 18.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1699066162109375, -1.139617919921875, -1.1093292236328125, -1.07904052734375, -1.0487518310546875, -1.018463134765625, -0.9881744384765625, -0.9578857421875, -0.9275970458984375, -0.897308349609375, -0.8670196533203125, -0.83673095703125, -0.8064422607421875, -0.776153564453125, -0.7458648681640625, -0.715576171875, -0.6852874755859375, -0.654998779296875, -0.6247100830078125, -0.59442138671875, -0.5641326904296875, -0.533843994140625, -0.5035552978515625, -0.4732666015625, -0.4429779052734375, -0.412689208984375, -0.3824005126953125, -0.35211181640625, -0.3218231201171875, -0.291534423828125, -0.2612457275390625, -0.23095703125, -0.2006683349609375, -0.170379638671875, -0.1400909423828125, -0.10980224609375, -0.0795135498046875, -0.049224853515625, -0.0189361572265625, 0.0113525390625, 0.0416412353515625, 0.071929931640625, 0.1022186279296875, 0.13250732421875, 0.1627960205078125, 0.193084716796875, 0.2233734130859375, 0.253662109375, 0.2839508056640625, 0.314239501953125, 0.3445281982421875, 0.37481689453125, 0.4051055908203125, 0.435394287109375, 0.4656829833984375, 0.4959716796875, 0.5262603759765625, 0.556549072265625, 0.5868377685546875, 0.61712646484375, 0.6474151611328125, 0.677703857421875, 0.7079925537109375, 0.73828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 14.0, 17.0, 30.0, 55.0, 86.0, 135.0, 148.0, 125.0, 135.0, 115.0, 50.0, 43.0, 18.0, 14.0, 12.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3709821701049805, -5.174742221832275, -4.97850227355957, -4.782262802124023, -4.586022853851318, -4.389782905578613, -4.193542957305908, -3.997303009033203, -3.801063060760498, -3.604823112487793, -3.408583402633667, -3.212343454360962, -3.016103506088257, -2.819863796234131, -2.623623847961426, -2.4273838996887207, -2.2311441898345947, -2.0349042415618896, -1.8386644124984741, -1.6424245834350586, -1.4461846351623535, -1.249944806098938, -1.0537049770355225, -0.8574650287628174, -0.6612251996994019, -0.46498531103134155, -0.26874545216560364, -0.07250559329986572, 0.12373429536819458, 0.3199741840362549, 0.5162140130996704, 0.7124539613723755, 0.908693790435791, 1.1049336194992065, 1.3011735677719116, 1.4974133968353271, 1.6936533451080322, 1.8898931741714478, 2.0861330032348633, 2.2823729515075684, 2.4786128997802734, 2.6748528480529785, 2.8710925579071045, 3.0673325061798096, 3.2635724544525146, 3.4598121643066406, 3.6560521125793457, 3.852292060852051, 4.048531532287598, 4.244771480560303, 4.441011428833008, 4.637250900268555, 4.83349084854126, 5.029730796813965, 5.22597074508667, 5.422210693359375, 5.61845064163208, 5.814690589904785, 6.01093053817749, 6.207170486450195, 6.403409957885742, 6.599649906158447, 6.795889854431152, 6.992129802703857, 7.1883697509765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 7.0, 10.0, 10.0, 9.0, 12.0, 15.0, 21.0, 22.0, 34.0, 28.0, 42.0, 34.0, 27.0, 46.0, 39.0, 57.0, 44.0, 48.0, 41.0, 62.0, 50.0, 37.0, 34.0, 43.0, 38.0, 22.0, 24.0, 26.0, 14.0, 17.0, 12.0, 12.0, 12.0, 9.0, 6.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.063088893890381, -1.9899500608444214, -1.916811227798462, -1.8436723947525024, -1.770533561706543, -1.697394609451294, -1.6242557764053345, -1.551116943359375, -1.4779781103134155, -1.404839277267456, -1.3317004442214966, -1.258561611175537, -1.185422658920288, -1.1122839450836182, -1.0391449928283691, -0.9660061597824097, -0.8928673267364502, -0.8197284936904907, -0.7465896606445312, -0.673450767993927, -0.6003119349479675, -0.5271731019020081, -0.4540342390537262, -0.38089537620544434, -0.30775654315948486, -0.2346176952123642, -0.16147884726524353, -0.08833999931812286, -0.015201151371002197, 0.057937681674957275, 0.13107654452323914, 0.204215407371521, 0.27735424041748047, 0.35049307346343994, 0.4236319363117218, 0.49677079916000366, 0.5699096322059631, 0.6430484652519226, 0.7161873579025269, 0.7893261909484863, 0.8624650239944458, 0.9356038570404053, 1.0087426900863647, 1.0818815231323242, 1.1550204753875732, 1.2281591892242432, 1.3012981414794922, 1.3744369745254517, 1.4475758075714111, 1.5207146406173706, 1.59385347366333, 1.6669923067092896, 1.740131139755249, 1.813270092010498, 1.8864089250564575, 1.959547758102417, 2.032686710357666, 2.105825662612915, 2.178964376449585, 2.252103328704834, 2.325242042541504, 2.398380994796753, 2.471519708633423, 2.544658660888672, 2.617797374725342]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 6.0, 8.0, 16.0, 19.0, 25.0, 29.0, 66.0, 107.0, 162.0, 249.0, 451.0, 741.0, 1430.0, 3065.0, 6910.0, 16624.0, 43500.0, 125590.0, 310545.0, 324384.0, 135526.0, 47493.0, 17652.0, 7229.0, 3170.0, 1560.0, 793.0, 456.0, 246.0, 156.0, 84.0, 79.0, 53.0, 36.0, 20.0, 11.0, 15.0, 9.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.424072265625, -0.4099540710449219, -0.39583587646484375, -0.3817176818847656, -0.3675994873046875, -0.3534812927246094, -0.33936309814453125, -0.3252449035644531, -0.311126708984375, -0.2970085144042969, -0.28289031982421875, -0.2687721252441406, -0.2546539306640625, -0.24053573608398438, -0.22641754150390625, -0.21229934692382812, -0.19818115234375, -0.18406295776367188, -0.16994476318359375, -0.15582656860351562, -0.1417083740234375, -0.12759017944335938, -0.11347198486328125, -0.09935379028320312, -0.085235595703125, -0.07111740112304688, -0.05699920654296875, -0.042881011962890625, -0.0287628173828125, -0.014644622802734375, -0.00052642822265625, 0.013591766357421875, 0.0277099609375, 0.041828155517578125, 0.05594635009765625, 0.07006454467773438, 0.0841827392578125, 0.09830093383789062, 0.11241912841796875, 0.12653732299804688, 0.140655517578125, 0.15477371215820312, 0.16889190673828125, 0.18301010131835938, 0.1971282958984375, 0.21124649047851562, 0.22536468505859375, 0.23948287963867188, 0.25360107421875, 0.2677192687988281, 0.28183746337890625, 0.2959556579589844, 0.3100738525390625, 0.3241920471191406, 0.33831024169921875, 0.3524284362792969, 0.366546630859375, 0.3806648254394531, 0.39478302001953125, 0.4089012145996094, 0.4230194091796875, 0.4371376037597656, 0.45125579833984375, 0.4653739929199219, 0.4794921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 7.0, 10.0, 7.0, 15.0, 9.0, 26.0, 23.0, 22.0, 18.0, 33.0, 36.0, 43.0, 37.0, 49.0, 48.0, 51.0, 49.0, 59.0, 52.0, 36.0, 46.0, 47.0, 50.0, 31.0, 29.0, 26.0, 22.0, 15.0, 15.0, 18.0, 13.0, 8.0, 5.0, 12.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5244140625, -1.4734344482421875, -1.422454833984375, -1.3714752197265625, -1.32049560546875, -1.2695159912109375, -1.218536376953125, -1.1675567626953125, -1.1165771484375, -1.0655975341796875, -1.014617919921875, -0.9636383056640625, -0.91265869140625, -0.8616790771484375, -0.810699462890625, -0.7597198486328125, -0.708740234375, -0.6577606201171875, -0.606781005859375, -0.5558013916015625, -0.50482177734375, -0.4538421630859375, -0.402862548828125, -0.3518829345703125, -0.3009033203125, -0.2499237060546875, -0.198944091796875, -0.1479644775390625, -0.09698486328125, -0.0460052490234375, 0.004974365234375, 0.0559539794921875, 0.10693359375, 0.1579132080078125, 0.208892822265625, 0.2598724365234375, 0.31085205078125, 0.3618316650390625, 0.412811279296875, 0.4637908935546875, 0.5147705078125, 0.5657501220703125, 0.616729736328125, 0.6677093505859375, 0.71868896484375, 0.7696685791015625, 0.820648193359375, 0.8716278076171875, 0.922607421875, 0.9735870361328125, 1.024566650390625, 1.0755462646484375, 1.12652587890625, 1.1775054931640625, 1.228485107421875, 1.2794647216796875, 1.3304443359375, 1.3814239501953125, 1.432403564453125, 1.4833831787109375, 1.53436279296875, 1.5853424072265625, 1.636322021484375, 1.6873016357421875, 1.73828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 10.0, 8.0, 17.0, 22.0, 33.0, 38.0, 58.0, 82.0, 128.0, 207.0, 321.0, 514.0, 850.0, 1251.0, 2073.0, 3647.0, 5992.0, 9830.0, 16471.0, 27862.0, 46777.0, 76564.0, 120267.0, 164654.0, 178530.0, 145444.0, 97520.0, 59992.0, 35978.0, 21432.0, 12702.0, 7763.0, 4612.0, 2736.0, 1598.0, 1021.0, 561.0, 334.0, 238.0, 145.0, 100.0, 58.0, 51.0, 31.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1871337890625, -0.18150711059570312, -0.17588043212890625, -0.17025375366210938, -0.1646270751953125, -0.15900039672851562, -0.15337371826171875, -0.14774703979492188, -0.142120361328125, -0.13649368286132812, -0.13086700439453125, -0.12524032592773438, -0.1196136474609375, -0.11398696899414062, -0.10836029052734375, -0.10273361206054688, -0.09710693359375, -0.09148025512695312, -0.08585357666015625, -0.08022689819335938, -0.0746002197265625, -0.06897354125976562, -0.06334686279296875, -0.057720184326171875, -0.052093505859375, -0.046466827392578125, -0.04084014892578125, -0.035213470458984375, -0.0295867919921875, -0.023960113525390625, -0.01833343505859375, -0.012706756591796875, -0.007080078125, -0.001453399658203125, 0.00417327880859375, 0.009799957275390625, 0.0154266357421875, 0.021053314208984375, 0.02667999267578125, 0.032306671142578125, 0.037933349609375, 0.043560028076171875, 0.04918670654296875, 0.054813385009765625, 0.0604400634765625, 0.06606674194335938, 0.07169342041015625, 0.07732009887695312, 0.08294677734375, 0.08857345581054688, 0.09420013427734375, 0.09982681274414062, 0.1054534912109375, 0.11108016967773438, 0.11670684814453125, 0.12233352661132812, 0.127960205078125, 0.13358688354492188, 0.13921356201171875, 0.14484024047851562, 0.1504669189453125, 0.15609359741210938, 0.16172027587890625, 0.16734695434570312, 0.1729736328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 10.0, 9.0, 12.0, 15.0, 19.0, 19.0, 22.0, 24.0, 28.0, 41.0, 31.0, 41.0, 41.0, 56.0, 51.0, 53.0, 53.0, 49.0, 47.0, 48.0, 41.0, 38.0, 36.0, 44.0, 30.0, 24.0, 23.0, 21.0, 12.0, 11.0, 8.0, 12.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.69366455078125, -3.5924072265625, -3.49114990234375, -3.389892578125, -3.28863525390625, -3.1873779296875, -3.08612060546875, -2.98486328125, -2.88360595703125, -2.7823486328125, -2.68109130859375, -2.579833984375, -2.47857666015625, -2.3773193359375, -2.27606201171875, -2.1748046875, -2.07354736328125, -1.9722900390625, -1.87103271484375, -1.769775390625, -1.66851806640625, -1.5672607421875, -1.46600341796875, -1.36474609375, -1.26348876953125, -1.1622314453125, -1.06097412109375, -0.959716796875, -0.85845947265625, -0.7572021484375, -0.65594482421875, -0.5546875, -0.45343017578125, -0.3521728515625, -0.25091552734375, -0.149658203125, -0.04840087890625, 0.0528564453125, 0.15411376953125, 0.25537109375, 0.35662841796875, 0.4578857421875, 0.55914306640625, 0.660400390625, 0.76165771484375, 0.8629150390625, 0.96417236328125, 1.0654296875, 1.16668701171875, 1.2679443359375, 1.36920166015625, 1.470458984375, 1.57171630859375, 1.6729736328125, 1.77423095703125, 1.87548828125, 1.97674560546875, 2.0780029296875, 2.17926025390625, 2.280517578125, 2.38177490234375, 2.4830322265625, 2.58428955078125, 2.685546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 11.0, 13.0, 35.0, 37.0, 72.0, 124.0, 218.0, 368.0, 790.0, 1735.0, 5217.0, 20397.0, 113813.0, 479533.0, 342577.0, 64532.0, 12596.0, 3742.0, 1310.0, 635.0, 338.0, 196.0, 108.0, 63.0, 31.0, 20.0, 15.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07769775390625, -0.07569742202758789, -0.07369709014892578, -0.07169675827026367, -0.06969642639160156, -0.06769609451293945, -0.06569576263427734, -0.06369543075561523, -0.061695098876953125, -0.059694766998291016, -0.057694435119628906, -0.0556941032409668, -0.05369377136230469, -0.05169343948364258, -0.04969310760498047, -0.04769277572631836, -0.04569244384765625, -0.04369211196899414, -0.04169178009033203, -0.03969144821166992, -0.03769111633300781, -0.0356907844543457, -0.033690452575683594, -0.031690120697021484, -0.029689788818359375, -0.027689456939697266, -0.025689125061035156, -0.023688793182373047, -0.021688461303710938, -0.019688129425048828, -0.01768779754638672, -0.01568746566772461, -0.0136871337890625, -0.01168680191040039, -0.009686470031738281, -0.007686138153076172, -0.0056858062744140625, -0.003685474395751953, -0.0016851425170898438, 0.0003151893615722656, 0.002315521240234375, 0.004315853118896484, 0.006316184997558594, 0.008316516876220703, 0.010316848754882812, 0.012317180633544922, 0.014317512512207031, 0.01631784439086914, 0.01831817626953125, 0.02031850814819336, 0.02231884002685547, 0.024319171905517578, 0.026319503784179688, 0.028319835662841797, 0.030320167541503906, 0.032320499420166016, 0.034320831298828125, 0.036321163177490234, 0.038321495056152344, 0.04032182693481445, 0.04232215881347656, 0.04432249069213867, 0.04632282257080078, 0.04832315444946289, 0.050323486328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 4.0, 6.0, 11.0, 16.0, 19.0, 37.0, 37.0, 65.0, 62.0, 83.0, 118.0, 110.0, 86.0, 79.0, 59.0, 49.0, 46.0, 26.0, 22.0, 13.0, 9.0, 13.0, 12.0, 2.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.553794860839844e-05, -4.435330629348755e-05, -4.316866397857666e-05, -4.198402166366577e-05, -4.079937934875488e-05, -3.9614737033843994e-05, -3.8430094718933105e-05, -3.724545240402222e-05, -3.606081008911133e-05, -3.487616777420044e-05, -3.369152545928955e-05, -3.250688314437866e-05, -3.1322240829467773e-05, -3.0137598514556885e-05, -2.8952956199645996e-05, -2.7768313884735107e-05, -2.658367156982422e-05, -2.539902925491333e-05, -2.421438694000244e-05, -2.3029744625091553e-05, -2.1845102310180664e-05, -2.0660459995269775e-05, -1.9475817680358887e-05, -1.8291175365447998e-05, -1.710653305053711e-05, -1.592189073562622e-05, -1.4737248420715332e-05, -1.3552606105804443e-05, -1.2367963790893555e-05, -1.1183321475982666e-05, -9.998679161071777e-06, -8.814036846160889e-06, -7.62939453125e-06, -6.444752216339111e-06, -5.260109901428223e-06, -4.075467586517334e-06, -2.8908252716064453e-06, -1.7061829566955566e-06, -5.21540641784668e-07, 6.631016731262207e-07, 1.8477439880371094e-06, 3.032386302947998e-06, 4.217028617858887e-06, 5.401670932769775e-06, 6.586313247680664e-06, 7.770955562591553e-06, 8.955597877502441e-06, 1.014024019241333e-05, 1.1324882507324219e-05, 1.2509524822235107e-05, 1.3694167137145996e-05, 1.4878809452056885e-05, 1.6063451766967773e-05, 1.7248094081878662e-05, 1.843273639678955e-05, 1.961737871170044e-05, 2.0802021026611328e-05, 2.1986663341522217e-05, 2.3171305656433105e-05, 2.4355947971343994e-05, 2.5540590286254883e-05, 2.672523260116577e-05, 2.790987491607666e-05, 2.909451723098755e-05, 3.0279159545898438e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 13.0, 25.0, 34.0, 42.0, 81.0, 88.0, 149.0, 282.0, 426.0, 941.0, 1921.0, 4753.0, 13187.0, 43405.0, 157966.0, 396853.0, 297443.0, 90721.0, 25866.0, 8244.0, 3096.0, 1378.0, 664.0, 349.0, 195.0, 150.0, 76.0, 61.0, 36.0, 24.0, 17.0, 11.0, 8.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04205322265625, -0.04064130783081055, -0.039229393005371094, -0.03781747817993164, -0.03640556335449219, -0.034993648529052734, -0.03358173370361328, -0.03216981887817383, -0.030757904052734375, -0.029345989227294922, -0.02793407440185547, -0.026522159576416016, -0.025110244750976562, -0.02369832992553711, -0.022286415100097656, -0.020874500274658203, -0.01946258544921875, -0.018050670623779297, -0.016638755798339844, -0.01522684097290039, -0.013814926147460938, -0.012403011322021484, -0.010991096496582031, -0.009579181671142578, -0.008167266845703125, -0.006755352020263672, -0.005343437194824219, -0.003931522369384766, -0.0025196075439453125, -0.0011076927185058594, 0.00030422210693359375, 0.0017161369323730469, 0.0031280517578125, 0.004539966583251953, 0.005951881408691406, 0.007363796234130859, 0.008775711059570312, 0.010187625885009766, 0.011599540710449219, 0.013011455535888672, 0.014423370361328125, 0.015835285186767578, 0.01724720001220703, 0.018659114837646484, 0.020071029663085938, 0.02148294448852539, 0.022894859313964844, 0.024306774139404297, 0.02571868896484375, 0.027130603790283203, 0.028542518615722656, 0.02995443344116211, 0.03136634826660156, 0.032778263092041016, 0.03419017791748047, 0.03560209274291992, 0.037014007568359375, 0.03842592239379883, 0.03983783721923828, 0.041249752044677734, 0.04266166687011719, 0.04407358169555664, 0.045485496520996094, 0.04689741134643555, 0.048309326171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 3.0, 9.0, 12.0, 16.0, 23.0, 19.0, 16.0, 35.0, 40.0, 56.0, 58.0, 83.0, 66.0, 86.0, 69.0, 65.0, 60.0, 61.0, 53.0, 41.0, 28.0, 22.0, 17.0, 11.0, 8.0, 5.0, 7.0, 8.0, 0.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.014617919921875, -0.01419830322265625, -0.0137786865234375, -0.01335906982421875, -0.012939453125, -0.01251983642578125, -0.0121002197265625, -0.01168060302734375, -0.011260986328125, -0.01084136962890625, -0.0104217529296875, -0.01000213623046875, -0.00958251953125, -0.00916290283203125, -0.0087432861328125, -0.00832366943359375, -0.007904052734375, -0.00748443603515625, -0.0070648193359375, -0.00664520263671875, -0.0062255859375, -0.00580596923828125, -0.0053863525390625, -0.00496673583984375, -0.004547119140625, -0.00412750244140625, -0.0037078857421875, -0.00328826904296875, -0.00286865234375, -0.00244903564453125, -0.0020294189453125, -0.00160980224609375, -0.001190185546875, -0.00077056884765625, -0.0003509521484375, 6.866455078125e-05, 0.00048828125, 0.00090789794921875, 0.0013275146484375, 0.00174713134765625, 0.002166748046875, 0.00258636474609375, 0.0030059814453125, 0.00342559814453125, 0.00384521484375, 0.00426483154296875, 0.0046844482421875, 0.00510406494140625, 0.005523681640625, 0.00594329833984375, 0.0063629150390625, 0.00678253173828125, 0.0072021484375, 0.00762176513671875, 0.0080413818359375, 0.00846099853515625, 0.008880615234375, 0.00930023193359375, 0.0097198486328125, 0.01013946533203125, 0.01055908203125, 0.01097869873046875, 0.0113983154296875, 0.01181793212890625, 0.012237548828125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 15.0, 38.0, 84.0, 152.0, 198.0, 176.0, 159.0, 104.0, 28.0, 26.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.076685905456543, -4.9233880043029785, -4.770089626312256, -4.616791725158691, -4.463493347167969, -4.310195446014404, -4.15689754486084, -4.003599166870117, -3.8503012657165527, -3.697003126144409, -3.5437049865722656, -3.390407085418701, -3.2371089458465576, -3.083810806274414, -2.9305129051208496, -2.777214765548706, -2.6239166259765625, -2.470618486404419, -2.3173203468322754, -2.164022445678711, -2.0107243061065674, -1.8574261665344238, -1.7041281461715698, -1.5508301258087158, -1.3975319862365723, -1.2442338466644287, -1.0909358263015747, -0.9376377463340759, -0.7843396663665771, -0.6310415863990784, -0.4777435064315796, -0.3244454860687256, -0.17114734649658203, -0.017849266529083252, 0.13544881343841553, 0.2887468934059143, 0.4420449733734131, 0.5953430533409119, 0.7486411333084106, 0.9019391536712646, 1.0552372932434082, 1.2085354328155518, 1.3618334531784058, 1.5151314735412598, 1.6684296131134033, 1.8217277526855469, 1.9750257730484009, 2.128323793411255, 2.2816219329833984, 2.434920072555542, 2.5882182121276855, 2.74151611328125, 2.8948142528533936, 3.048112392425537, 3.2014102935791016, 3.354708433151245, 3.5080065727233887, 3.6613047122955322, 3.814602851867676, 3.9679007530212402, 4.121198654174805, 4.274497032165527, 4.427794933319092, 4.581092834472656, 4.734391212463379]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 15.0, 10.0, 17.0, 14.0, 24.0, 31.0, 36.0, 39.0, 41.0, 46.0, 44.0, 56.0, 58.0, 60.0, 47.0, 73.0, 59.0, 35.0, 48.0, 36.0, 31.0, 29.0, 26.0, 24.0, 16.0, 12.0, 8.0, 8.0, 9.0, 5.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5080432891845703, -1.4532721042633057, -1.398500919342041, -1.3437297344207764, -1.2889585494995117, -1.234187364578247, -1.1794160604476929, -1.1246448755264282, -1.0698736906051636, -1.015102505683899, -0.9603313207626343, -0.9055600762367249, -0.8507888913154602, -0.7960177063941956, -0.7412464618682861, -0.6864752769470215, -0.6317040920257568, -0.5769329071044922, -0.5221617221832275, -0.4673904776573181, -0.41261929273605347, -0.3578481078147888, -0.3030768930912018, -0.24830567836761475, -0.1935344934463501, -0.13876329362392426, -0.08399209380149841, -0.02922089397907257, 0.02555030584335327, 0.08032149076461792, 0.13509270548820496, 0.189863920211792, 0.24463510513305664, 0.2994062900543213, 0.3541775047779083, 0.40894871950149536, 0.46371990442276, 0.5184910893440247, 0.5732623338699341, 0.6280335187911987, 0.6828047037124634, 0.737575888633728, 0.7923470735549927, 0.8471183180809021, 0.9018895030021667, 0.9566606879234314, 1.0114319324493408, 1.0662031173706055, 1.1209743022918701, 1.1757454872131348, 1.2305166721343994, 1.285287857055664, 1.3400590419769287, 1.3948302268981934, 1.4496015310287476, 1.5043727159500122, 1.5591439008712769, 1.6139150857925415, 1.6686862707138062, 1.7234574556350708, 1.778228759765625, 1.8329999446868896, 1.8877711296081543, 1.942542314529419, 1.9973134994506836]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 12.0, 18.0, 25.0, 34.0, 60.0, 85.0, 182.0, 364.0, 799.0, 2041.0, 6928.0, 27566.0, 143249.0, 701292.0, 130325.0, 25625.0, 6441.0, 1952.0, 726.0, 325.0, 189.0, 108.0, 61.0, 30.0, 27.0, 17.0, 12.0, 8.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.7901611328125, -2.709228515625, -2.6282958984375, -2.54736328125, -2.4664306640625, -2.385498046875, -2.3045654296875, -2.2236328125, -2.1427001953125, -2.061767578125, -1.9808349609375, -1.89990234375, -1.8189697265625, -1.738037109375, -1.6571044921875, -1.576171875, -1.4952392578125, -1.414306640625, -1.3333740234375, -1.25244140625, -1.1715087890625, -1.090576171875, -1.0096435546875, -0.9287109375, -0.8477783203125, -0.766845703125, -0.6859130859375, -0.60498046875, -0.5240478515625, -0.443115234375, -0.3621826171875, -0.28125, -0.2003173828125, -0.119384765625, -0.0384521484375, 0.04248046875, 0.1234130859375, 0.204345703125, 0.2852783203125, 0.3662109375, 0.4471435546875, 0.528076171875, 0.6090087890625, 0.68994140625, 0.7708740234375, 0.851806640625, 0.9327392578125, 1.013671875, 1.0946044921875, 1.175537109375, 1.2564697265625, 1.33740234375, 1.4183349609375, 1.499267578125, 1.5802001953125, 1.6611328125, 1.7420654296875, 1.822998046875, 1.9039306640625, 1.98486328125, 2.0657958984375, 2.146728515625, 2.2276611328125, 2.30859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 8.0, 8.0, 7.0, 19.0, 14.0, 10.0, 28.0, 24.0, 29.0, 33.0, 47.0, 37.0, 44.0, 48.0, 54.0, 67.0, 49.0, 55.0, 49.0, 49.0, 46.0, 37.0, 44.0, 27.0, 27.0, 30.0, 10.0, 23.0, 17.0, 13.0, 7.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.803558349609375, -2.69696044921875, -2.590362548828125, -2.4837646484375, -2.377166748046875, -2.27056884765625, -2.163970947265625, -2.057373046875, -1.950775146484375, -1.84417724609375, -1.737579345703125, -1.6309814453125, -1.524383544921875, -1.41778564453125, -1.311187744140625, -1.20458984375, -1.097991943359375, -0.99139404296875, -0.884796142578125, -0.7781982421875, -0.671600341796875, -0.56500244140625, -0.458404541015625, -0.351806640625, -0.245208740234375, -0.13861083984375, -0.032012939453125, 0.0745849609375, 0.181182861328125, 0.28778076171875, 0.394378662109375, 0.5009765625, 0.607574462890625, 0.71417236328125, 0.820770263671875, 0.9273681640625, 1.033966064453125, 1.14056396484375, 1.247161865234375, 1.353759765625, 1.460357666015625, 1.56695556640625, 1.673553466796875, 1.7801513671875, 1.886749267578125, 1.99334716796875, 2.099945068359375, 2.20654296875, 2.313140869140625, 2.41973876953125, 2.526336669921875, 2.6329345703125, 2.739532470703125, 2.84613037109375, 2.952728271484375, 3.059326171875, 3.165924072265625, 3.27252197265625, 3.379119873046875, 3.4857177734375, 3.592315673828125, 3.69891357421875, 3.805511474609375, 3.912109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 5.0, 9.0, 12.0, 7.0, 23.0, 26.0, 26.0, 35.0, 50.0, 84.0, 85.0, 148.0, 201.0, 297.0, 526.0, 1388.0, 11388.0, 460406.0, 558440.0, 12294.0, 1496.0, 538.0, 291.0, 206.0, 159.0, 98.0, 78.0, 45.0, 42.0, 41.0, 22.0, 21.0, 16.0, 14.0, 5.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625, -5.46435546875, -5.3037109375, -5.14306640625, -4.982421875, -4.82177734375, -4.6611328125, -4.50048828125, -4.33984375, -4.17919921875, -4.0185546875, -3.85791015625, -3.697265625, -3.53662109375, -3.3759765625, -3.21533203125, -3.0546875, -2.89404296875, -2.7333984375, -2.57275390625, -2.412109375, -2.25146484375, -2.0908203125, -1.93017578125, -1.76953125, -1.60888671875, -1.4482421875, -1.28759765625, -1.126953125, -0.96630859375, -0.8056640625, -0.64501953125, -0.484375, -0.32373046875, -0.1630859375, -0.00244140625, 0.158203125, 0.31884765625, 0.4794921875, 0.64013671875, 0.80078125, 0.96142578125, 1.1220703125, 1.28271484375, 1.443359375, 1.60400390625, 1.7646484375, 1.92529296875, 2.0859375, 2.24658203125, 2.4072265625, 2.56787109375, 2.728515625, 2.88916015625, 3.0498046875, 3.21044921875, 3.37109375, 3.53173828125, 3.6923828125, 3.85302734375, 4.013671875, 4.17431640625, 4.3349609375, 4.49560546875, 4.65625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 5.0, 6.0, 4.0, 3.0, 9.0, 11.0, 10.0, 17.0, 17.0, 10.0, 18.0, 18.0, 38.0, 27.0, 39.0, 41.0, 39.0, 47.0, 61.0, 57.0, 60.0, 49.0, 54.0, 44.0, 33.0, 37.0, 34.0, 24.0, 28.0, 26.0, 19.0, 19.0, 18.0, 12.0, 10.0, 11.0, 13.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.784698486328125, -3.66705322265625, -3.549407958984375, -3.4317626953125, -3.314117431640625, -3.19647216796875, -3.078826904296875, -2.961181640625, -2.843536376953125, -2.72589111328125, -2.608245849609375, -2.4906005859375, -2.372955322265625, -2.25531005859375, -2.137664794921875, -2.02001953125, -1.902374267578125, -1.78472900390625, -1.667083740234375, -1.5494384765625, -1.431793212890625, -1.31414794921875, -1.196502685546875, -1.078857421875, -0.961212158203125, -0.84356689453125, -0.725921630859375, -0.6082763671875, -0.490631103515625, -0.37298583984375, -0.255340576171875, -0.1376953125, -0.020050048828125, 0.09759521484375, 0.215240478515625, 0.3328857421875, 0.450531005859375, 0.56817626953125, 0.685821533203125, 0.803466796875, 0.921112060546875, 1.03875732421875, 1.156402587890625, 1.2740478515625, 1.391693115234375, 1.50933837890625, 1.626983642578125, 1.74462890625, 1.862274169921875, 1.97991943359375, 2.097564697265625, 2.2152099609375, 2.332855224609375, 2.45050048828125, 2.568145751953125, 2.685791015625, 2.803436279296875, 2.92108154296875, 3.038726806640625, 3.1563720703125, 3.274017333984375, 3.39166259765625, 3.509307861328125, 3.626953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 19.0, 25.0, 76.0, 152.0, 382.0, 968.0, 7065.0, 1010370.0, 27230.0, 1484.0, 458.0, 167.0, 78.0, 26.0, 12.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.169921875, -3.050933837890625, -2.93194580078125, -2.812957763671875, -2.6939697265625, -2.574981689453125, -2.45599365234375, -2.337005615234375, -2.218017578125, -2.099029541015625, -1.98004150390625, -1.861053466796875, -1.7420654296875, -1.623077392578125, -1.50408935546875, -1.385101318359375, -1.26611328125, -1.147125244140625, -1.02813720703125, -0.909149169921875, -0.7901611328125, -0.671173095703125, -0.55218505859375, -0.433197021484375, -0.314208984375, -0.195220947265625, -0.07623291015625, 0.042755126953125, 0.1617431640625, 0.280731201171875, 0.39971923828125, 0.518707275390625, 0.6376953125, 0.756683349609375, 0.87567138671875, 0.994659423828125, 1.1136474609375, 1.232635498046875, 1.35162353515625, 1.470611572265625, 1.589599609375, 1.708587646484375, 1.82757568359375, 1.946563720703125, 2.0655517578125, 2.184539794921875, 2.30352783203125, 2.422515869140625, 2.54150390625, 2.660491943359375, 2.77947998046875, 2.898468017578125, 3.0174560546875, 3.136444091796875, 3.25543212890625, 3.374420166015625, 3.493408203125, 3.612396240234375, 3.73138427734375, 3.850372314453125, 3.9693603515625, 4.088348388671875, 4.20733642578125, 4.326324462890625, 4.4453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 11.0, 8.0, 19.0, 21.0, 32.0, 46.0, 83.0, 174.0, 302.0, 100.0, 61.0, 43.0, 26.0, 28.0, 10.0, 15.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002713203430175781, -0.00026402994990348816, -0.0002567395567893982, -0.00024944916367530823, -0.00024215877056121826, -0.0002348683774471283, -0.00022757798433303833, -0.00022028759121894836, -0.0002129971981048584, -0.00020570680499076843, -0.00019841641187667847, -0.0001911260187625885, -0.00018383562564849854, -0.00017654523253440857, -0.0001692548394203186, -0.00016196444630622864, -0.00015467405319213867, -0.0001473836600780487, -0.00014009326696395874, -0.00013280287384986877, -0.0001255124807357788, -0.00011822208762168884, -0.00011093169450759888, -0.00010364130139350891, -9.635090827941895e-05, -8.906051516532898e-05, -8.177012205123901e-05, -7.447972893714905e-05, -6.718933582305908e-05, -5.9898942708969116e-05, -5.260854959487915e-05, -4.5318156480789185e-05, -3.802776336669922e-05, -3.073737025260925e-05, -2.3446977138519287e-05, -1.615658402442932e-05, -8.866190910339355e-06, -1.5757977962493896e-06, 5.714595317840576e-06, 1.3004988431930542e-05, 2.0295381546020508e-05, 2.7585774660110474e-05, 3.487616777420044e-05, 4.2166560888290405e-05, 4.945695400238037e-05, 5.674734711647034e-05, 6.40377402305603e-05, 7.132813334465027e-05, 7.861852645874023e-05, 8.59089195728302e-05, 9.319931268692017e-05, 0.00010048970580101013, 0.0001077800989151001, 0.00011507049202919006, 0.00012236088514328003, 0.00012965127825737, 0.00013694167137145996, 0.00014423206448554993, 0.0001515224575996399, 0.00015881285071372986, 0.00016610324382781982, 0.0001733936369419098, 0.00018068403005599976, 0.00018797442317008972, 0.0001952648162841797]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 17.0, 12.0, 30.0, 55.0, 103.0, 229.0, 482.0, 1334.0, 18131.0, 1011387.0, 14615.0, 1215.0, 495.0, 198.0, 101.0, 63.0, 32.0, 18.0, 12.0, 9.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.062255859375, -3.94091796875, -3.819580078125, -3.6982421875, -3.576904296875, -3.45556640625, -3.334228515625, -3.212890625, -3.091552734375, -2.97021484375, -2.848876953125, -2.7275390625, -2.606201171875, -2.48486328125, -2.363525390625, -2.2421875, -2.120849609375, -1.99951171875, -1.878173828125, -1.7568359375, -1.635498046875, -1.51416015625, -1.392822265625, -1.271484375, -1.150146484375, -1.02880859375, -0.907470703125, -0.7861328125, -0.664794921875, -0.54345703125, -0.422119140625, -0.30078125, -0.179443359375, -0.05810546875, 0.063232421875, 0.1845703125, 0.305908203125, 0.42724609375, 0.548583984375, 0.669921875, 0.791259765625, 0.91259765625, 1.033935546875, 1.1552734375, 1.276611328125, 1.39794921875, 1.519287109375, 1.640625, 1.761962890625, 1.88330078125, 2.004638671875, 2.1259765625, 2.247314453125, 2.36865234375, 2.489990234375, 2.611328125, 2.732666015625, 2.85400390625, 2.975341796875, 3.0966796875, 3.218017578125, 3.33935546875, 3.460693359375, 3.58203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 10.0, 33.0, 51.0, 89.0, 383.0, 279.0, 89.0, 39.0, 16.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9375, -0.8998260498046875, -0.862152099609375, -0.8244781494140625, -0.78680419921875, -0.7491302490234375, -0.711456298828125, -0.6737823486328125, -0.6361083984375, -0.5984344482421875, -0.560760498046875, -0.5230865478515625, -0.48541259765625, -0.4477386474609375, -0.410064697265625, -0.3723907470703125, -0.334716796875, -0.2970428466796875, -0.259368896484375, -0.2216949462890625, -0.18402099609375, -0.1463470458984375, -0.108673095703125, -0.0709991455078125, -0.0333251953125, 0.0043487548828125, 0.042022705078125, 0.0796966552734375, 0.11737060546875, 0.1550445556640625, 0.192718505859375, 0.2303924560546875, 0.26806640625, 0.3057403564453125, 0.343414306640625, 0.3810882568359375, 0.41876220703125, 0.4564361572265625, 0.494110107421875, 0.5317840576171875, 0.5694580078125, 0.6071319580078125, 0.644805908203125, 0.6824798583984375, 0.72015380859375, 0.7578277587890625, 0.795501708984375, 0.8331756591796875, 0.870849609375, 0.9085235595703125, 0.946197509765625, 0.9838714599609375, 1.02154541015625, 1.0592193603515625, 1.096893310546875, 1.1345672607421875, 1.1722412109375, 1.2099151611328125, 1.247589111328125, 1.2852630615234375, 1.32293701171875, 1.3606109619140625, 1.398284912109375, 1.4359588623046875, 1.4736328125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 10.0, 23.0, 31.0, 55.0, 98.0, 110.0, 123.0, 140.0, 127.0, 100.0, 74.0, 34.0, 30.0, 13.0, 10.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.202199935913086, -7.987643718719482, -7.773087501525879, -7.558531284332275, -7.343975067138672, -7.129419326782227, -6.914863109588623, -6.7003068923950195, -6.485750675201416, -6.2711944580078125, -6.056638240814209, -5.8420820236206055, -5.62752628326416, -5.412969589233398, -5.198413848876953, -4.98385763168335, -4.769301414489746, -4.554745197296143, -4.340188980102539, -4.1256327629089355, -3.911076784133911, -3.6965205669403076, -3.481964588165283, -3.2674083709716797, -3.052852153778076, -2.8382959365844727, -2.623739719390869, -2.4091837406158447, -2.194627523422241, -1.9800713062286377, -1.7655152082443237, -1.5509591102600098, -1.336402416229248, -1.1218461990356445, -0.9072901010513306, -0.6927339434623718, -0.4781777858734131, -0.26362156867980957, -0.049065470695495605, 0.16549062728881836, 0.3800468444824219, 0.5946030020713806, 0.8091591596603394, 1.0237152576446533, 1.2382714748382568, 1.4528276920318604, 1.6673837900161743, 1.8819398880004883, 2.096496105194092, 2.3110523223876953, 2.525608539581299, 2.7401645183563232, 2.9547207355499268, 3.1692769527435303, 3.3838329315185547, 3.598389148712158, 3.8129453659057617, 4.027501583099365, 4.242057800292969, 4.456614017486572, 4.671170234680176, 4.885725975036621, 5.100282192230225, 5.314838409423828, 5.529394626617432]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 4.0, 6.0, 13.0, 7.0, 10.0, 7.0, 7.0, 18.0, 12.0, 27.0, 21.0, 29.0, 29.0, 45.0, 32.0, 37.0, 36.0, 40.0, 43.0, 40.0, 43.0, 51.0, 42.0, 39.0, 31.0, 37.0, 37.0, 34.0, 33.0, 24.0, 29.0, 27.0, 24.0, 11.0, 20.0, 11.0, 6.0, 7.0, 7.0, 5.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.1834845542907715, -5.010655403137207, -4.837826251983643, -4.664997100830078, -4.4921674728393555, -4.319338321685791, -4.146509170532227, -3.973680019378662, -3.8008508682250977, -3.628021717071533, -3.4551925659179688, -3.282363176345825, -3.1095340251922607, -2.9367048740386963, -2.7638754844665527, -2.5910463333129883, -2.418217182159424, -2.2453880310058594, -2.072558879852295, -1.8997294902801514, -1.726900339126587, -1.5540711879730225, -1.3812419176101685, -1.2084126472473145, -1.03558349609375, -0.8627542853355408, -0.6899250745773315, -0.5170958638191223, -0.3442666530609131, -0.17143744230270386, 0.001391768455505371, 0.17422103881835938, 0.34705066680908203, 0.5198798775672913, 0.6927090883255005, 0.8655382990837097, 1.038367509841919, 1.2111966609954834, 1.3840259313583374, 1.5568552017211914, 1.7296843528747559, 1.9025135040283203, 2.0753426551818848, 2.2481720447540283, 2.4210011959075928, 2.5938303470611572, 2.766659736633301, 2.9394888877868652, 3.1123180389404297, 3.285147190093994, 3.4579763412475586, 3.630805730819702, 3.8036348819732666, 3.976464033126831, 4.149293422698975, 4.322122573852539, 4.4949517250061035, 4.667780876159668, 4.840610027313232, 5.013439178466797, 5.1862688064575195, 5.359097957611084, 5.531927108764648, 5.704756259918213, 5.877585411071777]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 9.0, 13.0, 5.0, 18.0, 27.0, 20.0, 23.0, 27.0, 48.0, 44.0, 79.0, 130.0, 299.0, 1302.0, 72392.0, 4094661.0, 23782.0, 776.0, 223.0, 94.0, 71.0, 43.0, 47.0, 37.0, 21.0, 20.0, 10.0, 14.0, 8.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.6796875, -14.26513671875, -13.8505859375, -13.43603515625, -13.021484375, -12.60693359375, -12.1923828125, -11.77783203125, -11.36328125, -10.94873046875, -10.5341796875, -10.11962890625, -9.705078125, -9.29052734375, -8.8759765625, -8.46142578125, -8.046875, -7.63232421875, -7.2177734375, -6.80322265625, -6.388671875, -5.97412109375, -5.5595703125, -5.14501953125, -4.73046875, -4.31591796875, -3.9013671875, -3.48681640625, -3.072265625, -2.65771484375, -2.2431640625, -1.82861328125, -1.4140625, -0.99951171875, -0.5849609375, -0.17041015625, 0.244140625, 0.65869140625, 1.0732421875, 1.48779296875, 1.90234375, 2.31689453125, 2.7314453125, 3.14599609375, 3.560546875, 3.97509765625, 4.3896484375, 4.80419921875, 5.21875, 5.63330078125, 6.0478515625, 6.46240234375, 6.876953125, 7.29150390625, 7.7060546875, 8.12060546875, 8.53515625, 8.94970703125, 9.3642578125, 9.77880859375, 10.193359375, 10.60791015625, 11.0224609375, 11.43701171875, 11.8515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 2.0, 16.0, 17.0, 15.0, 18.0, 21.0, 27.0, 33.0, 38.0, 51.0, 57.0, 54.0, 47.0, 59.0, 59.0, 49.0, 56.0, 60.0, 48.0, 38.0, 37.0, 39.0, 22.0, 14.0, 20.0, 14.0, 15.0, 9.0, 5.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.12109375, -2.057586669921875, -1.99407958984375, -1.930572509765625, -1.8670654296875, -1.803558349609375, -1.74005126953125, -1.676544189453125, -1.613037109375, -1.549530029296875, -1.48602294921875, -1.422515869140625, -1.3590087890625, -1.295501708984375, -1.23199462890625, -1.168487548828125, -1.10498046875, -1.041473388671875, -0.97796630859375, -0.914459228515625, -0.8509521484375, -0.787445068359375, -0.72393798828125, -0.660430908203125, -0.596923828125, -0.533416748046875, -0.46990966796875, -0.406402587890625, -0.3428955078125, -0.279388427734375, -0.21588134765625, -0.152374267578125, -0.0888671875, -0.025360107421875, 0.03814697265625, 0.101654052734375, 0.1651611328125, 0.228668212890625, 0.29217529296875, 0.355682373046875, 0.419189453125, 0.482696533203125, 0.54620361328125, 0.609710693359375, 0.6732177734375, 0.736724853515625, 0.80023193359375, 0.863739013671875, 0.92724609375, 0.990753173828125, 1.05426025390625, 1.117767333984375, 1.1812744140625, 1.244781494140625, 1.30828857421875, 1.371795654296875, 1.435302734375, 1.498809814453125, 1.56231689453125, 1.625823974609375, 1.6893310546875, 1.752838134765625, 1.81634521484375, 1.879852294921875, 1.943359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 20.0, 36.0, 65.0, 103.0, 203.0, 489.0, 1254.0, 4519.0, 39863.0, 2429501.0, 1681106.0, 31047.0, 4004.0, 1155.0, 413.0, 212.0, 101.0, 51.0, 44.0, 15.0, 11.0, 9.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.6419677734375, -5.459716796875, -5.2774658203125, -5.09521484375, -4.9129638671875, -4.730712890625, -4.5484619140625, -4.3662109375, -4.1839599609375, -4.001708984375, -3.8194580078125, -3.63720703125, -3.4549560546875, -3.272705078125, -3.0904541015625, -2.908203125, -2.7259521484375, -2.543701171875, -2.3614501953125, -2.17919921875, -1.9969482421875, -1.814697265625, -1.6324462890625, -1.4501953125, -1.2679443359375, -1.085693359375, -0.9034423828125, -0.72119140625, -0.5389404296875, -0.356689453125, -0.1744384765625, 0.0078125, 0.1900634765625, 0.372314453125, 0.5545654296875, 0.73681640625, 0.9190673828125, 1.101318359375, 1.2835693359375, 1.4658203125, 1.6480712890625, 1.830322265625, 2.0125732421875, 2.19482421875, 2.3770751953125, 2.559326171875, 2.7415771484375, 2.923828125, 3.1060791015625, 3.288330078125, 3.4705810546875, 3.65283203125, 3.8350830078125, 4.017333984375, 4.1995849609375, 4.3818359375, 4.5640869140625, 4.746337890625, 4.9285888671875, 5.11083984375, 5.2930908203125, 5.475341796875, 5.6575927734375, 5.83984375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 25.0, 30.0, 38.0, 66.0, 86.0, 152.0, 218.0, 331.0, 523.0, 651.0, 593.0, 442.0, 302.0, 197.0, 133.0, 88.0, 57.0, 38.0, 18.0, 17.0, 14.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1125030517578125, -1.077545166015625, -1.0425872802734375, -1.00762939453125, -0.9726715087890625, -0.937713623046875, -0.9027557373046875, -0.8677978515625, -0.8328399658203125, -0.797882080078125, -0.7629241943359375, -0.72796630859375, -0.6930084228515625, -0.658050537109375, -0.6230926513671875, -0.588134765625, -0.5531768798828125, -0.518218994140625, -0.4832611083984375, -0.44830322265625, -0.4133453369140625, -0.378387451171875, -0.3434295654296875, -0.3084716796875, -0.2735137939453125, -0.238555908203125, -0.2035980224609375, -0.16864013671875, -0.1336822509765625, -0.098724365234375, -0.0637664794921875, -0.02880859375, 0.0061492919921875, 0.041107177734375, 0.0760650634765625, 0.11102294921875, 0.1459808349609375, 0.180938720703125, 0.2158966064453125, 0.2508544921875, 0.2858123779296875, 0.320770263671875, 0.3557281494140625, 0.39068603515625, 0.4256439208984375, 0.460601806640625, 0.4955596923828125, 0.530517578125, 0.5654754638671875, 0.600433349609375, 0.6353912353515625, 0.67034912109375, 0.7053070068359375, 0.740264892578125, 0.7752227783203125, 0.8101806640625, 0.8451385498046875, 0.880096435546875, 0.9150543212890625, 0.95001220703125, 0.9849700927734375, 1.019927978515625, 1.0548858642578125, 1.08984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 28.0, 39.0, 65.0, 101.0, 137.0, 158.0, 145.0, 111.0, 101.0, 49.0, 34.0, 14.0, 10.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6952319145202637, -3.508453845977783, -3.3216757774353027, -3.134897470474243, -2.9481194019317627, -2.7613413333892822, -2.5745630264282227, -2.387784957885742, -2.2010068893432617, -2.0142288208007812, -1.8274506330490112, -1.6406724452972412, -1.4538943767547607, -1.2671163082122803, -1.0803381204605103, -0.8935599327087402, -0.7067818641662598, -0.5200037360191345, -0.3332256078720093, -0.14644747972488403, 0.04033064842224121, 0.22710877656936646, 0.4138869047164917, 0.6006650924682617, 0.7874431610107422, 0.9742212891578674, 1.1609994173049927, 1.3477776050567627, 1.5345556735992432, 1.7213337421417236, 1.9081119298934937, 2.0948901176452637, 2.281667709350586, 2.4684457778930664, 2.655223846435547, 2.8420021533966064, 3.028780221939087, 3.2155582904815674, 3.402336597442627, 3.5891146659851074, 3.775892734527588, 3.9626708030700684, 4.149448871612549, 4.336226940155029, 4.523005485534668, 4.709783554077148, 4.896561622619629, 5.083339691162109, 5.27011775970459, 5.45689582824707, 5.643673896789551, 5.830451965332031, 6.017230033874512, 6.20400857925415, 6.390786647796631, 6.577564716339111, 6.764342784881592, 6.951120853424072, 7.137898921966553, 7.324676990509033, 7.511455535888672, 7.698233604431152, 7.885011672973633, 8.071789741516113, 8.258567810058594]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 5.0, 8.0, 17.0, 12.0, 12.0, 21.0, 17.0, 25.0, 21.0, 23.0, 30.0, 25.0, 49.0, 55.0, 45.0, 52.0, 43.0, 37.0, 46.0, 50.0, 52.0, 39.0, 46.0, 37.0, 32.0, 36.0, 29.0, 29.0, 25.0, 13.0, 13.0, 8.0, 8.0, 8.0, 8.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0219712257385254, -1.9532334804534912, -1.8844958543777466, -1.8157581090927124, -1.7470204830169678, -1.6782827377319336, -1.6095449924468994, -1.5408072471618652, -1.4720696210861206, -1.4033318758010864, -1.3345942497253418, -1.2658565044403076, -1.1971187591552734, -1.1283811330795288, -1.0596433877944946, -0.9909057021141052, -0.9221680164337158, -0.8534303307533264, -0.784692645072937, -0.7159548997879028, -0.6472172141075134, -0.578479528427124, -0.5097417831420898, -0.44100409746170044, -0.37226641178131104, -0.30352872610092163, -0.23479101061820984, -0.16605331003665924, -0.09731560945510864, -0.02857792377471924, 0.040159791707992554, 0.10889750719070435, 0.17763495445251465, 0.24637265503406525, 0.31511035561561584, 0.38384807109832764, 0.45258575677871704, 0.5213234424591064, 0.5900611877441406, 0.65879887342453, 0.7275365591049194, 0.7962742447853088, 0.8650119304656982, 0.9337496757507324, 1.0024874210357666, 1.0712250471115112, 1.1399627923965454, 1.20870041847229, 1.2774381637573242, 1.3461759090423584, 1.414913535118103, 1.4836512804031372, 1.5523889064788818, 1.621126651763916, 1.6898643970489502, 1.7586021423339844, 1.827339768409729, 1.8960775136947632, 1.9648151397705078, 2.033552885055542, 2.102290630340576, 2.1710281372070312, 2.2397658824920654, 2.3085036277770996, 2.377241373062134]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 12.0, 14.0, 32.0, 41.0, 66.0, 111.0, 190.0, 331.0, 701.0, 1812.0, 6256.0, 33787.0, 248185.0, 598606.0, 132926.0, 18843.0, 4152.0, 1288.0, 530.0, 272.0, 134.0, 100.0, 53.0, 33.0, 28.0, 20.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8342361450195312, -0.8037261962890625, -0.7732162475585938, -0.742706298828125, -0.7121963500976562, -0.6816864013671875, -0.6511764526367188, -0.62066650390625, -0.5901565551757812, -0.5596466064453125, -0.5291366577148438, -0.498626708984375, -0.46811676025390625, -0.4376068115234375, -0.40709686279296875, -0.3765869140625, -0.34607696533203125, -0.3155670166015625, -0.28505706787109375, -0.254547119140625, -0.22403717041015625, -0.1935272216796875, -0.16301727294921875, -0.13250732421875, -0.10199737548828125, -0.0714874267578125, -0.04097747802734375, -0.010467529296875, 0.02004241943359375, 0.0505523681640625, 0.08106231689453125, 0.111572265625, 0.14208221435546875, 0.1725921630859375, 0.20310211181640625, 0.233612060546875, 0.26412200927734375, 0.2946319580078125, 0.32514190673828125, 0.35565185546875, 0.38616180419921875, 0.4166717529296875, 0.44718170166015625, 0.477691650390625, 0.5082015991210938, 0.5387115478515625, 0.5692214965820312, 0.5997314453125, 0.6302413940429688, 0.6607513427734375, 0.6912612915039062, 0.721771240234375, 0.7522811889648438, 0.7827911376953125, 0.8133010864257812, 0.84381103515625, 0.8743209838867188, 0.9048309326171875, 0.9353408813476562, 0.965850830078125, 0.9963607788085938, 1.0268707275390625, 1.0573806762695312, 1.087890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 18.0, 27.0, 21.0, 32.0, 45.0, 45.0, 64.0, 79.0, 70.0, 80.0, 86.0, 65.0, 60.0, 61.0, 70.0, 46.0, 28.0, 21.0, 17.0, 14.0, 15.0, 7.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1328125, -3.054229736328125, -2.97564697265625, -2.897064208984375, -2.8184814453125, -2.739898681640625, -2.66131591796875, -2.582733154296875, -2.504150390625, -2.425567626953125, -2.34698486328125, -2.268402099609375, -2.1898193359375, -2.111236572265625, -2.03265380859375, -1.954071044921875, -1.87548828125, -1.796905517578125, -1.71832275390625, -1.639739990234375, -1.5611572265625, -1.482574462890625, -1.40399169921875, -1.325408935546875, -1.246826171875, -1.168243408203125, -1.08966064453125, -1.011077880859375, -0.9324951171875, -0.853912353515625, -0.77532958984375, -0.696746826171875, -0.6181640625, -0.539581298828125, -0.46099853515625, -0.382415771484375, -0.3038330078125, -0.225250244140625, -0.14666748046875, -0.068084716796875, 0.010498046875, 0.089080810546875, 0.16766357421875, 0.246246337890625, 0.3248291015625, 0.403411865234375, 0.48199462890625, 0.560577392578125, 0.63916015625, 0.717742919921875, 0.79632568359375, 0.874908447265625, 0.9534912109375, 1.032073974609375, 1.11065673828125, 1.189239501953125, 1.267822265625, 1.346405029296875, 1.42498779296875, 1.503570556640625, 1.5821533203125, 1.660736083984375, 1.73931884765625, 1.817901611328125, 1.896484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 10.0, 13.0, 21.0, 39.0, 33.0, 56.0, 95.0, 118.0, 173.0, 256.0, 357.0, 565.0, 843.0, 1262.0, 1876.0, 2722.0, 4250.0, 6307.0, 9607.0, 14447.0, 21771.0, 32311.0, 48222.0, 70842.0, 99730.0, 128798.0, 144234.0, 132018.0, 101849.0, 73226.0, 50424.0, 33735.0, 22576.0, 15534.0, 9932.0, 6742.0, 4385.0, 2963.0, 2028.0, 1306.0, 942.0, 624.0, 412.0, 291.0, 192.0, 141.0, 83.0, 60.0, 43.0, 33.0, 26.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.1531982421875, -0.1483440399169922, -0.14348983764648438, -0.13863563537597656, -0.13378143310546875, -0.12892723083496094, -0.12407302856445312, -0.11921882629394531, -0.1143646240234375, -0.10951042175292969, -0.10465621948242188, -0.09980201721191406, -0.09494781494140625, -0.09009361267089844, -0.08523941040039062, -0.08038520812988281, -0.075531005859375, -0.07067680358886719, -0.06582260131835938, -0.06096839904785156, -0.05611419677734375, -0.05125999450683594, -0.046405792236328125, -0.04155158996582031, -0.0366973876953125, -0.03184318542480469, -0.026988983154296875, -0.022134780883789062, -0.01728057861328125, -0.012426376342773438, -0.007572174072265625, -0.0027179718017578125, 0.00213623046875, 0.0069904327392578125, 0.011844635009765625, 0.016698837280273438, 0.02155303955078125, 0.026407241821289062, 0.031261444091796875, 0.03611564636230469, 0.0409698486328125, 0.04582405090332031, 0.050678253173828125, 0.05553245544433594, 0.06038665771484375, 0.06524085998535156, 0.07009506225585938, 0.07494926452636719, 0.079803466796875, 0.08465766906738281, 0.08951187133789062, 0.09436607360839844, 0.09922027587890625, 0.10407447814941406, 0.10892868041992188, 0.11378288269042969, 0.1186370849609375, 0.12349128723144531, 0.12834548950195312, 0.13319969177246094, 0.13805389404296875, 0.14290809631347656, 0.14776229858398438, 0.1526165008544922, 0.157470703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 8.0, 5.0, 15.0, 13.0, 12.0, 10.0, 21.0, 16.0, 18.0, 24.0, 31.0, 20.0, 40.0, 29.0, 37.0, 54.0, 41.0, 39.0, 47.0, 47.0, 38.0, 34.0, 35.0, 35.0, 33.0, 25.0, 26.0, 11.0, 25.0, 20.0, 16.0, 16.0, 18.0, 13.0, 19.0, 17.0, 13.0, 11.0, 9.0, 8.0, 11.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.3671875, -2.287353515625, -2.20751953125, -2.127685546875, -2.0478515625, -1.968017578125, -1.88818359375, -1.808349609375, -1.728515625, -1.648681640625, -1.56884765625, -1.489013671875, -1.4091796875, -1.329345703125, -1.24951171875, -1.169677734375, -1.08984375, -1.010009765625, -0.93017578125, -0.850341796875, -0.7705078125, -0.690673828125, -0.61083984375, -0.531005859375, -0.451171875, -0.371337890625, -0.29150390625, -0.211669921875, -0.1318359375, -0.052001953125, 0.02783203125, 0.107666015625, 0.1875, 0.267333984375, 0.34716796875, 0.427001953125, 0.5068359375, 0.586669921875, 0.66650390625, 0.746337890625, 0.826171875, 0.906005859375, 0.98583984375, 1.065673828125, 1.1455078125, 1.225341796875, 1.30517578125, 1.385009765625, 1.46484375, 1.544677734375, 1.62451171875, 1.704345703125, 1.7841796875, 1.864013671875, 1.94384765625, 2.023681640625, 2.103515625, 2.183349609375, 2.26318359375, 2.343017578125, 2.4228515625, 2.502685546875, 2.58251953125, 2.662353515625, 2.7421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 11.0, 17.0, 36.0, 41.0, 65.0, 135.0, 178.0, 361.0, 689.0, 1374.0, 3412.0, 10210.0, 37271.0, 154807.0, 441495.0, 293977.0, 75518.0, 19023.0, 5751.0, 2131.0, 899.0, 500.0, 256.0, 157.0, 91.0, 61.0, 24.0, 25.0, 14.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053985595703125, -0.052170753479003906, -0.05035591125488281, -0.04854106903076172, -0.046726226806640625, -0.04491138458251953, -0.04309654235839844, -0.041281700134277344, -0.03946685791015625, -0.037652015686035156, -0.03583717346191406, -0.03402233123779297, -0.032207489013671875, -0.03039264678955078, -0.028577804565429688, -0.026762962341308594, -0.0249481201171875, -0.023133277893066406, -0.021318435668945312, -0.01950359344482422, -0.017688751220703125, -0.01587390899658203, -0.014059066772460938, -0.012244224548339844, -0.01042938232421875, -0.008614540100097656, -0.0067996978759765625, -0.004984855651855469, -0.003170013427734375, -0.0013551712036132812, 0.0004596710205078125, 0.0022745132446289062, 0.00408935546875, 0.005904197692871094, 0.0077190399169921875, 0.009533882141113281, 0.011348724365234375, 0.013163566589355469, 0.014978408813476562, 0.016793251037597656, 0.01860809326171875, 0.020422935485839844, 0.022237777709960938, 0.02405261993408203, 0.025867462158203125, 0.02768230438232422, 0.029497146606445312, 0.031311988830566406, 0.0331268310546875, 0.034941673278808594, 0.03675651550292969, 0.03857135772705078, 0.040386199951171875, 0.04220104217529297, 0.04401588439941406, 0.045830726623535156, 0.04764556884765625, 0.049460411071777344, 0.05127525329589844, 0.05309009552001953, 0.054904937744140625, 0.05671977996826172, 0.05853462219238281, 0.060349464416503906, 0.062164306640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 12.0, 14.0, 19.0, 28.0, 37.0, 42.0, 53.0, 82.0, 84.0, 112.0, 82.0, 91.0, 84.0, 74.0, 52.0, 39.0, 24.0, 15.0, 12.0, 13.0, 11.0, 2.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11732292175293e-05, -2.988334745168686e-05, -2.859346568584442e-05, -2.7303583920001984e-05, -2.6013702154159546e-05, -2.4723820388317108e-05, -2.343393862247467e-05, -2.2144056856632233e-05, -2.0854175090789795e-05, -1.9564293324947357e-05, -1.827441155910492e-05, -1.698452979326248e-05, -1.5694648027420044e-05, -1.4404766261577606e-05, -1.3114884495735168e-05, -1.182500272989273e-05, -1.0535120964050293e-05, -9.245239198207855e-06, -7.955357432365417e-06, -6.66547566652298e-06, -5.375593900680542e-06, -4.085712134838104e-06, -2.7958303689956665e-06, -1.5059486031532288e-06, -2.1606683731079102e-07, 1.0738149285316467e-06, 2.3636966943740845e-06, 3.6535784602165222e-06, 4.94346022605896e-06, 6.233341991901398e-06, 7.5232237577438354e-06, 8.813105523586273e-06, 1.0102987289428711e-05, 1.1392869055271149e-05, 1.2682750821113586e-05, 1.3972632586956024e-05, 1.5262514352798462e-05, 1.65523961186409e-05, 1.7842277884483337e-05, 1.9132159650325775e-05, 2.0422041416168213e-05, 2.171192318201065e-05, 2.300180494785309e-05, 2.4291686713695526e-05, 2.5581568479537964e-05, 2.68714502453804e-05, 2.816133201122284e-05, 2.9451213777065277e-05, 3.0741095542907715e-05, 3.203097730875015e-05, 3.332085907459259e-05, 3.461074084043503e-05, 3.5900622606277466e-05, 3.7190504372119904e-05, 3.848038613796234e-05, 3.977026790380478e-05, 4.106014966964722e-05, 4.2350031435489655e-05, 4.363991320133209e-05, 4.492979496717453e-05, 4.621967673301697e-05, 4.7509558498859406e-05, 4.879944026470184e-05, 5.008932203054428e-05, 5.137920379638672e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 3.0, 15.0, 15.0, 21.0, 22.0, 33.0, 40.0, 67.0, 127.0, 174.0, 297.0, 609.0, 1213.0, 2811.0, 7912.0, 26809.0, 107771.0, 383912.0, 374547.0, 103296.0, 25736.0, 7666.0, 2903.0, 1157.0, 614.0, 307.0, 157.0, 100.0, 58.0, 44.0, 28.0, 22.0, 18.0, 8.0, 9.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061126708984375, -0.05932807922363281, -0.057529449462890625, -0.05573081970214844, -0.05393218994140625, -0.05213356018066406, -0.050334930419921875, -0.04853630065917969, -0.0467376708984375, -0.04493904113769531, -0.043140411376953125, -0.04134178161621094, -0.03954315185546875, -0.03774452209472656, -0.035945892333984375, -0.03414726257324219, -0.0323486328125, -0.030550003051757812, -0.028751373291015625, -0.026952743530273438, -0.02515411376953125, -0.023355484008789062, -0.021556854248046875, -0.019758224487304688, -0.0179595947265625, -0.016160964965820312, -0.014362335205078125, -0.012563705444335938, -0.01076507568359375, -0.008966445922851562, -0.007167816162109375, -0.0053691864013671875, -0.003570556640625, -0.0017719268798828125, 2.6702880859375e-05, 0.0018253326416015625, 0.00362396240234375, 0.0054225921630859375, 0.007221221923828125, 0.009019851684570312, 0.0108184814453125, 0.012617111206054688, 0.014415740966796875, 0.016214370727539062, 0.01801300048828125, 0.019811630249023438, 0.021610260009765625, 0.023408889770507812, 0.02520751953125, 0.027006149291992188, 0.028804779052734375, 0.030603408813476562, 0.03240203857421875, 0.03420066833496094, 0.035999298095703125, 0.03779792785644531, 0.0395965576171875, 0.04139518737792969, 0.043193817138671875, 0.04499244689941406, 0.04679107666015625, 0.04858970642089844, 0.050388336181640625, 0.05218696594238281, 0.053985595703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 6.0, 10.0, 23.0, 13.0, 21.0, 25.0, 32.0, 38.0, 45.0, 39.0, 51.0, 51.0, 58.0, 56.0, 66.0, 53.0, 60.0, 55.0, 32.0, 52.0, 33.0, 29.0, 15.0, 25.0, 21.0, 13.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01247406005859375, -0.012079238891601562, -0.011684417724609375, -0.011289596557617188, -0.010894775390625, -0.010499954223632812, -0.010105133056640625, -0.009710311889648438, -0.00931549072265625, -0.008920669555664062, -0.008525848388671875, -0.008131027221679688, -0.0077362060546875, -0.0073413848876953125, -0.006946563720703125, -0.0065517425537109375, -0.00615692138671875, -0.0057621002197265625, -0.005367279052734375, -0.0049724578857421875, -0.00457763671875, -0.0041828155517578125, -0.003787994384765625, -0.0033931732177734375, -0.00299835205078125, -0.0026035308837890625, -0.002208709716796875, -0.0018138885498046875, -0.0014190673828125, -0.0010242462158203125, -0.000629425048828125, -0.0002346038818359375, 0.00016021728515625, 0.0005550384521484375, 0.000949859619140625, 0.0013446807861328125, 0.001739501953125, 0.0021343231201171875, 0.002529144287109375, 0.0029239654541015625, 0.00331878662109375, 0.0037136077880859375, 0.004108428955078125, 0.0045032501220703125, 0.0048980712890625, 0.0052928924560546875, 0.005687713623046875, 0.0060825347900390625, 0.00647735595703125, 0.0068721771240234375, 0.007266998291015625, 0.0076618194580078125, 0.008056640625, 0.008451461791992188, 0.008846282958984375, 0.009241104125976562, 0.00963592529296875, 0.010030746459960938, 0.010425567626953125, 0.010820388793945312, 0.0112152099609375, 0.011610031127929688, 0.012004852294921875, 0.012399673461914062, 0.01279449462890625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 18.0, 34.0, 62.0, 130.0, 143.0, 185.0, 162.0, 126.0, 73.0, 41.0, 12.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458585739135742, -3.3119616508483887, -3.1653378009796143, -3.0187137126922607, -2.8720898628234863, -2.725465774536133, -2.5788416862487793, -2.432217836380005, -2.2855939865112305, -2.138969898223877, -1.9923460483551025, -1.845721960067749, -1.6990981101989746, -1.552474021911621, -1.4058500528335571, -1.2592260837554932, -1.1126019954681396, -0.9659780263900757, -0.8193540573120117, -0.672730028629303, -0.526106059551239, -0.37948209047317505, -0.2328580617904663, -0.08623409271240234, 0.06038987636566162, 0.20701386034488678, 0.35363784432411194, 0.5002618432044983, 0.6468858122825623, 0.7935097813606262, 0.940133810043335, 1.086757779121399, 1.233381748199463, 1.3800057172775269, 1.5266296863555908, 1.6732537746429443, 1.8198776245117188, 1.9665017127990723, 2.113125801086426, 2.2597496509552, 2.4063735008239746, 2.552997589111328, 2.6996214389801025, 2.846245527267456, 2.9928693771362305, 3.139493465423584, 3.2861175537109375, 3.432741403579712, 3.5793654918670654, 3.725989580154419, 3.8726134300231934, 4.019237518310547, 4.1658616065979, 4.312485218048096, 4.459109306335449, 4.605733394622803, 4.752357482910156, 4.89898157119751, 5.045605659484863, 5.192229270935059, 5.338853359222412, 5.485477447509766, 5.632101535797119, 5.778725624084473, 5.925349235534668]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 27.0, 25.0, 31.0, 37.0, 46.0, 61.0, 91.0, 89.0, 71.0, 82.0, 88.0, 75.0, 64.0, 60.0, 45.0, 31.0, 18.0, 17.0, 9.0, 12.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.437211513519287, -3.353278160095215, -3.2693448066711426, -3.1854114532470703, -3.101478099822998, -3.017544746398926, -2.9336113929748535, -2.8496780395507812, -2.765744686126709, -2.6818113327026367, -2.5978779792785645, -2.513944625854492, -2.43001127243042, -2.3460779190063477, -2.2621445655822754, -2.178211212158203, -2.0942776203155518, -2.0103442668914795, -1.9264109134674072, -1.842477560043335, -1.7585442066192627, -1.6746108531951904, -1.5906773805618286, -1.5067440271377563, -1.422810673713684, -1.3388773202896118, -1.2549439668655396, -1.1710104942321777, -1.0870771408081055, -1.0031437873840332, -0.9192104339599609, -0.8352770805358887, -0.7513439655303955, -0.6674106121063232, -0.583477258682251, -0.49954384565353394, -0.41561049222946167, -0.3316771388053894, -0.24774372577667236, -0.1638103723526001, -0.07987701892852783, 0.0040563493967056274, 0.08798971772193909, 0.17192310094833374, 0.255856454372406, 0.33978980779647827, 0.4237232208251953, 0.5076565742492676, 0.5915899276733398, 0.6755232810974121, 0.7594566345214844, 0.8433900475502014, 0.9273234009742737, 1.0112566947937012, 1.095190167427063, 1.1791235208511353, 1.2630568742752075, 1.3469902276992798, 1.430923581123352, 1.5148570537567139, 1.5987904071807861, 1.6827237606048584, 1.7666571140289307, 1.850590467453003, 1.9345238208770752]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 7.0, 6.0, 5.0, 7.0, 4.0, 8.0, 16.0, 28.0, 27.0, 54.0, 86.0, 151.0, 257.0, 573.0, 1284.0, 3409.0, 10156.0, 34169.0, 143262.0, 628872.0, 170017.0, 38548.0, 11248.0, 3705.0, 1407.0, 549.0, 278.0, 152.0, 94.0, 44.0, 41.0, 30.0, 16.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.400390625, -2.31915283203125, -2.2379150390625, -2.15667724609375, -2.075439453125, -1.99420166015625, -1.9129638671875, -1.83172607421875, -1.75048828125, -1.66925048828125, -1.5880126953125, -1.50677490234375, -1.425537109375, -1.34429931640625, -1.2630615234375, -1.18182373046875, -1.1005859375, -1.01934814453125, -0.9381103515625, -0.85687255859375, -0.775634765625, -0.69439697265625, -0.6131591796875, -0.53192138671875, -0.45068359375, -0.36944580078125, -0.2882080078125, -0.20697021484375, -0.125732421875, -0.04449462890625, 0.0367431640625, 0.11798095703125, 0.19921875, 0.28045654296875, 0.3616943359375, 0.44293212890625, 0.524169921875, 0.60540771484375, 0.6866455078125, 0.76788330078125, 0.84912109375, 0.93035888671875, 1.0115966796875, 1.09283447265625, 1.174072265625, 1.25531005859375, 1.3365478515625, 1.41778564453125, 1.4990234375, 1.58026123046875, 1.6614990234375, 1.74273681640625, 1.823974609375, 1.90521240234375, 1.9864501953125, 2.06768798828125, 2.14892578125, 2.23016357421875, 2.3114013671875, 2.39263916015625, 2.473876953125, 2.55511474609375, 2.6363525390625, 2.71759033203125, 2.798828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 5.0, 2.0, 5.0, 11.0, 12.0, 18.0, 22.0, 21.0, 18.0, 26.0, 35.0, 27.0, 41.0, 37.0, 59.0, 45.0, 64.0, 48.0, 60.0, 57.0, 53.0, 50.0, 44.0, 35.0, 35.0, 42.0, 26.0, 24.0, 18.0, 10.0, 13.0, 9.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.697265625, -2.600738525390625, -2.50421142578125, -2.407684326171875, -2.3111572265625, -2.214630126953125, -2.11810302734375, -2.021575927734375, -1.925048828125, -1.828521728515625, -1.73199462890625, -1.635467529296875, -1.5389404296875, -1.442413330078125, -1.34588623046875, -1.249359130859375, -1.15283203125, -1.056304931640625, -0.95977783203125, -0.863250732421875, -0.7667236328125, -0.670196533203125, -0.57366943359375, -0.477142333984375, -0.380615234375, -0.284088134765625, -0.18756103515625, -0.091033935546875, 0.0054931640625, 0.102020263671875, 0.19854736328125, 0.295074462890625, 0.3916015625, 0.488128662109375, 0.58465576171875, 0.681182861328125, 0.7777099609375, 0.874237060546875, 0.97076416015625, 1.067291259765625, 1.163818359375, 1.260345458984375, 1.35687255859375, 1.453399658203125, 1.5499267578125, 1.646453857421875, 1.74298095703125, 1.839508056640625, 1.93603515625, 2.032562255859375, 2.12908935546875, 2.225616455078125, 2.3221435546875, 2.418670654296875, 2.51519775390625, 2.611724853515625, 2.708251953125, 2.804779052734375, 2.90130615234375, 2.997833251953125, 3.0943603515625, 3.190887451171875, 3.28741455078125, 3.383941650390625, 3.48046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 14.0, 16.0, 27.0, 24.0, 46.0, 60.0, 78.0, 147.0, 244.0, 475.0, 1553.0, 20636.0, 886914.0, 132380.0, 4402.0, 745.0, 291.0, 170.0, 106.0, 67.0, 46.0, 28.0, 26.0, 19.0, 11.0, 8.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.47857666015625, -5.2657470703125, -5.05291748046875, -4.840087890625, -4.62725830078125, -4.4144287109375, -4.20159912109375, -3.98876953125, -3.77593994140625, -3.5631103515625, -3.35028076171875, -3.137451171875, -2.92462158203125, -2.7117919921875, -2.49896240234375, -2.2861328125, -2.07330322265625, -1.8604736328125, -1.64764404296875, -1.434814453125, -1.22198486328125, -1.0091552734375, -0.79632568359375, -0.58349609375, -0.37066650390625, -0.1578369140625, 0.05499267578125, 0.267822265625, 0.48065185546875, 0.6934814453125, 0.90631103515625, 1.119140625, 1.33197021484375, 1.5447998046875, 1.75762939453125, 1.970458984375, 2.18328857421875, 2.3961181640625, 2.60894775390625, 2.82177734375, 3.03460693359375, 3.2474365234375, 3.46026611328125, 3.673095703125, 3.88592529296875, 4.0987548828125, 4.31158447265625, 4.5244140625, 4.73724365234375, 4.9500732421875, 5.16290283203125, 5.375732421875, 5.58856201171875, 5.8013916015625, 6.01422119140625, 6.22705078125, 6.43988037109375, 6.6527099609375, 6.86553955078125, 7.078369140625, 7.29119873046875, 7.5040283203125, 7.71685791015625, 7.9296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 10.0, 8.0, 13.0, 16.0, 19.0, 22.0, 29.0, 34.0, 36.0, 43.0, 53.0, 40.0, 58.0, 65.0, 64.0, 49.0, 64.0, 50.0, 44.0, 34.0, 47.0, 36.0, 29.0, 29.0, 25.0, 10.0, 17.0, 10.0, 18.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.5859375, -4.46826171875, -4.3505859375, -4.23291015625, -4.115234375, -3.99755859375, -3.8798828125, -3.76220703125, -3.64453125, -3.52685546875, -3.4091796875, -3.29150390625, -3.173828125, -3.05615234375, -2.9384765625, -2.82080078125, -2.703125, -2.58544921875, -2.4677734375, -2.35009765625, -2.232421875, -2.11474609375, -1.9970703125, -1.87939453125, -1.76171875, -1.64404296875, -1.5263671875, -1.40869140625, -1.291015625, -1.17333984375, -1.0556640625, -0.93798828125, -0.8203125, -0.70263671875, -0.5849609375, -0.46728515625, -0.349609375, -0.23193359375, -0.1142578125, 0.00341796875, 0.12109375, 0.23876953125, 0.3564453125, 0.47412109375, 0.591796875, 0.70947265625, 0.8271484375, 0.94482421875, 1.0625, 1.18017578125, 1.2978515625, 1.41552734375, 1.533203125, 1.65087890625, 1.7685546875, 1.88623046875, 2.00390625, 2.12158203125, 2.2392578125, 2.35693359375, 2.474609375, 2.59228515625, 2.7099609375, 2.82763671875, 2.9453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 18.0, 13.0, 33.0, 37.0, 69.0, 129.0, 294.0, 790.0, 3028.0, 37705.0, 901938.0, 97670.0, 5018.0, 1077.0, 341.0, 154.0, 82.0, 51.0, 27.0, 18.0, 17.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.70172119140625, -1.6378173828125, -1.57391357421875, -1.510009765625, -1.44610595703125, -1.3822021484375, -1.31829833984375, -1.25439453125, -1.19049072265625, -1.1265869140625, -1.06268310546875, -0.998779296875, -0.93487548828125, -0.8709716796875, -0.80706787109375, -0.7431640625, -0.67926025390625, -0.6153564453125, -0.55145263671875, -0.487548828125, -0.42364501953125, -0.3597412109375, -0.29583740234375, -0.23193359375, -0.16802978515625, -0.1041259765625, -0.04022216796875, 0.023681640625, 0.08758544921875, 0.1514892578125, 0.21539306640625, 0.279296875, 0.34320068359375, 0.4071044921875, 0.47100830078125, 0.534912109375, 0.59881591796875, 0.6627197265625, 0.72662353515625, 0.79052734375, 0.85443115234375, 0.9183349609375, 0.98223876953125, 1.046142578125, 1.11004638671875, 1.1739501953125, 1.23785400390625, 1.3017578125, 1.36566162109375, 1.4295654296875, 1.49346923828125, 1.557373046875, 1.62127685546875, 1.6851806640625, 1.74908447265625, 1.81298828125, 1.87689208984375, 1.9407958984375, 2.00469970703125, 2.068603515625, 2.13250732421875, 2.1964111328125, 2.26031494140625, 2.32421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 12.0, 23.0, 44.0, 37.0, 73.0, 119.0, 199.0, 171.0, 95.0, 69.0, 30.0, 31.0, 21.0, 18.0, 15.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020563602447509766, -0.00019852258265018463, -0.0001914091408252716, -0.00018429569900035858, -0.00017718225717544556, -0.00017006881535053253, -0.0001629553735256195, -0.00015584193170070648, -0.00014872848987579346, -0.00014161504805088043, -0.0001345016062259674, -0.00012738816440105438, -0.00012027472257614136, -0.00011316128075122833, -0.00010604783892631531, -9.893439710140228e-05, -9.182095527648926e-05, -8.470751345157623e-05, -7.759407162666321e-05, -7.048062980175018e-05, -6.336718797683716e-05, -5.625374615192413e-05, -4.914030432701111e-05, -4.2026862502098083e-05, -3.491342067718506e-05, -2.7799978852272034e-05, -2.068653702735901e-05, -1.3573095202445984e-05, -6.459653377532959e-06, 6.537884473800659e-07, 7.76723027229309e-06, 1.4880672097206116e-05, 2.199411392211914e-05, 2.9107555747032166e-05, 3.622099757194519e-05, 4.3334439396858215e-05, 5.044788122177124e-05, 5.7561323046684265e-05, 6.467476487159729e-05, 7.178820669651031e-05, 7.890164852142334e-05, 8.601509034633636e-05, 9.312853217124939e-05, 0.00010024197399616241, 0.00010735541582107544, 0.00011446885764598846, 0.00012158229947090149, 0.00012869574129581451, 0.00013580918312072754, 0.00014292262494564056, 0.0001500360667705536, 0.00015714950859546661, 0.00016426295042037964, 0.00017137639224529266, 0.0001784898340702057, 0.0001856032758951187, 0.00019271671772003174, 0.00019983015954494476, 0.0002069436013698578, 0.0002140570431947708, 0.00022117048501968384, 0.00022828392684459686, 0.0002353973686695099, 0.0002425108104944229, 0.00024962425231933594]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 38.0, 35.0, 66.0, 138.0, 266.0, 560.0, 1428.0, 5026.0, 52187.0, 866079.0, 112071.0, 7546.0, 1830.0, 633.0, 305.0, 129.0, 85.0, 44.0, 22.0, 12.0, 7.0, 6.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7255859375, -1.6631011962890625, -1.600616455078125, -1.5381317138671875, -1.47564697265625, -1.4131622314453125, -1.350677490234375, -1.2881927490234375, -1.2257080078125, -1.1632232666015625, -1.100738525390625, -1.0382537841796875, -0.97576904296875, -0.9132843017578125, -0.850799560546875, -0.7883148193359375, -0.725830078125, -0.6633453369140625, -0.600860595703125, -0.5383758544921875, -0.47589111328125, -0.4134063720703125, -0.350921630859375, -0.2884368896484375, -0.2259521484375, -0.1634674072265625, -0.100982666015625, -0.0384979248046875, 0.02398681640625, 0.0864715576171875, 0.148956298828125, 0.2114410400390625, 0.27392578125, 0.3364105224609375, 0.398895263671875, 0.4613800048828125, 0.52386474609375, 0.5863494873046875, 0.648834228515625, 0.7113189697265625, 0.7738037109375, 0.8362884521484375, 0.898773193359375, 0.9612579345703125, 1.02374267578125, 1.0862274169921875, 1.148712158203125, 1.2111968994140625, 1.273681640625, 1.3361663818359375, 1.398651123046875, 1.4611358642578125, 1.52362060546875, 1.5861053466796875, 1.648590087890625, 1.7110748291015625, 1.7735595703125, 1.8360443115234375, 1.898529052734375, 1.9610137939453125, 2.02349853515625, 2.0859832763671875, 2.148468017578125, 2.2109527587890625, 2.2734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 11.0, 28.0, 32.0, 51.0, 90.0, 127.0, 249.0, 138.0, 104.0, 46.0, 37.0, 25.0, 22.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.9521484375, -0.9312896728515625, -0.910430908203125, -0.8895721435546875, -0.86871337890625, -0.8478546142578125, -0.826995849609375, -0.8061370849609375, -0.7852783203125, -0.7644195556640625, -0.743560791015625, -0.7227020263671875, -0.70184326171875, -0.6809844970703125, -0.660125732421875, -0.6392669677734375, -0.618408203125, -0.5975494384765625, -0.576690673828125, -0.5558319091796875, -0.53497314453125, -0.5141143798828125, -0.493255615234375, -0.4723968505859375, -0.4515380859375, -0.4306793212890625, -0.409820556640625, -0.3889617919921875, -0.36810302734375, -0.3472442626953125, -0.326385498046875, -0.3055267333984375, -0.28466796875, -0.2638092041015625, -0.242950439453125, -0.2220916748046875, -0.20123291015625, -0.1803741455078125, -0.159515380859375, -0.1386566162109375, -0.1177978515625, -0.0969390869140625, -0.076080322265625, -0.0552215576171875, -0.03436279296875, -0.0135040283203125, 0.007354736328125, 0.0282135009765625, 0.049072265625, 0.0699310302734375, 0.090789794921875, 0.1116485595703125, 0.13250732421875, 0.1533660888671875, 0.174224853515625, 0.1950836181640625, 0.2159423828125, 0.2368011474609375, 0.257659912109375, 0.2785186767578125, 0.29937744140625, 0.3202362060546875, 0.341094970703125, 0.3619537353515625, 0.3828125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 14.0, 90.0, 314.0, 399.0, 158.0, 30.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.453025817871094, -38.737335205078125, -38.021644592285156, -37.30595397949219, -36.59026336669922, -35.874576568603516, -35.15888595581055, -34.44319534301758, -33.72750473022461, -33.01181411743164, -32.29612350463867, -31.580434799194336, -30.864744186401367, -30.1490535736084, -29.433364868164062, -28.717674255371094, -28.001983642578125, -27.286293029785156, -26.570602416992188, -25.85491371154785, -25.139223098754883, -24.423532485961914, -23.707843780517578, -22.99215316772461, -22.27646255493164, -21.560771942138672, -20.845081329345703, -20.129392623901367, -19.4137020111084, -18.69801139831543, -17.982322692871094, -17.266632080078125, -16.550941467285156, -15.835250854492188, -15.119561195373535, -14.403871536254883, -13.688180923461914, -12.972490310668945, -12.256800651550293, -11.54111099243164, -10.825420379638672, -10.109729766845703, -9.39404010772705, -8.678350448608398, -7.96265983581543, -7.246969699859619, -6.531279563903809, -5.815589427947998, -5.0998992919921875, -4.384209156036377, -3.6685190200805664, -2.952828884124756, -2.2371387481689453, -1.5214486122131348, -0.8057584762573242, -0.09006834030151367, 0.6256217956542969, 1.3413119316101074, 2.057002067565918, 2.7726922035217285, 3.488382339477539, 4.20407247543335, 4.91976261138916, 5.635452747344971, 6.351142883300781]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 11.0, 12.0, 12.0, 14.0, 20.0, 20.0, 23.0, 29.0, 23.0, 32.0, 35.0, 40.0, 40.0, 42.0, 56.0, 45.0, 46.0, 47.0, 36.0, 41.0, 38.0, 31.0, 35.0, 40.0, 32.0, 20.0, 30.0, 27.0, 15.0, 15.0, 14.0, 10.0, 12.0, 6.0, 7.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.363114356994629, -5.211436748504639, -5.059759616851807, -4.908082008361816, -4.756404876708984, -4.604727268218994, -4.453050136566162, -4.301372528076172, -4.14969539642334, -3.9980180263519287, -3.8463406562805176, -3.6946632862091064, -3.5429859161376953, -3.391308307647705, -3.239630937576294, -3.087953567504883, -2.9362759590148926, -2.7845985889434814, -2.6329212188720703, -2.481243848800659, -2.329566478729248, -2.177888870239258, -2.0262115001678467, -1.8745341300964355, -1.7228567600250244, -1.5711793899536133, -1.4195020198822021, -1.2678245306015015, -1.1161471605300903, -0.9644697904586792, -0.8127923607826233, -0.6611149311065674, -0.509437084197998, -0.3577596843242645, -0.206082284450531, -0.054404884576797485, 0.09727251529693604, 0.24894988536834717, 0.4006273150444031, 0.552304744720459, 0.7039821147918701, 0.8556594848632812, 1.0073368549346924, 1.159014344215393, 1.3106917142868042, 1.4623690843582153, 1.614046573638916, 1.7657239437103271, 1.9174013137817383, 2.0690786838531494, 2.2207560539245605, 2.3724334239959717, 2.524110794067383, 2.675788402557373, 2.827465772628784, 2.9791431427001953, 3.1308205127716064, 3.2824978828430176, 3.4341752529144287, 3.58585262298584, 3.73753023147583, 3.889207363128662, 4.040884971618652, 4.192562103271484, 4.344239711761475]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 7.0, 14.0, 11.0, 17.0, 20.0, 22.0, 24.0, 36.0, 56.0, 73.0, 72.0, 101.0, 143.0, 210.0, 356.0, 660.0, 1420.0, 4138.0, 18343.0, 129601.0, 1509500.0, 2284506.0, 211069.0, 25473.0, 5054.0, 1455.0, 645.0, 324.0, 223.0, 147.0, 111.0, 81.0, 74.0, 55.0, 53.0, 31.0, 28.0, 19.0, 21.0, 17.0, 19.0, 9.0, 10.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.634765625, -3.524993896484375, -3.41522216796875, -3.305450439453125, -3.1956787109375, -3.085906982421875, -2.97613525390625, -2.866363525390625, -2.756591796875, -2.646820068359375, -2.53704833984375, -2.427276611328125, -2.3175048828125, -2.207733154296875, -2.09796142578125, -1.988189697265625, -1.87841796875, -1.768646240234375, -1.65887451171875, -1.549102783203125, -1.4393310546875, -1.329559326171875, -1.21978759765625, -1.110015869140625, -1.000244140625, -0.890472412109375, -0.78070068359375, -0.670928955078125, -0.5611572265625, -0.451385498046875, -0.34161376953125, -0.231842041015625, -0.1220703125, -0.012298583984375, 0.09747314453125, 0.207244873046875, 0.3170166015625, 0.426788330078125, 0.53656005859375, 0.646331787109375, 0.756103515625, 0.865875244140625, 0.97564697265625, 1.085418701171875, 1.1951904296875, 1.304962158203125, 1.41473388671875, 1.524505615234375, 1.63427734375, 1.744049072265625, 1.85382080078125, 1.963592529296875, 2.0733642578125, 2.183135986328125, 2.29290771484375, 2.402679443359375, 2.512451171875, 2.622222900390625, 2.73199462890625, 2.841766357421875, 2.9515380859375, 3.061309814453125, 3.17108154296875, 3.280853271484375, 3.390625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 23.0, 23.0, 21.0, 26.0, 22.0, 36.0, 46.0, 64.0, 54.0, 68.0, 52.0, 56.0, 61.0, 70.0, 56.0, 60.0, 39.0, 38.0, 30.0, 31.0, 21.0, 18.0, 11.0, 13.0, 9.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.3559722900390625, -1.292999267578125, -1.2300262451171875, -1.16705322265625, -1.1040802001953125, -1.041107177734375, -0.9781341552734375, -0.9151611328125, -0.8521881103515625, -0.789215087890625, -0.7262420654296875, -0.66326904296875, -0.6002960205078125, -0.537322998046875, -0.4743499755859375, -0.411376953125, -0.3484039306640625, -0.285430908203125, -0.2224578857421875, -0.15948486328125, -0.0965118408203125, -0.033538818359375, 0.0294342041015625, 0.0924072265625, 0.1553802490234375, 0.218353271484375, 0.2813262939453125, 0.34429931640625, 0.4072723388671875, 0.470245361328125, 0.5332183837890625, 0.59619140625, 0.6591644287109375, 0.722137451171875, 0.7851104736328125, 0.84808349609375, 0.9110565185546875, 0.974029541015625, 1.0370025634765625, 1.0999755859375, 1.1629486083984375, 1.225921630859375, 1.2888946533203125, 1.35186767578125, 1.4148406982421875, 1.477813720703125, 1.5407867431640625, 1.603759765625, 1.6667327880859375, 1.729705810546875, 1.7926788330078125, 1.85565185546875, 1.9186248779296875, 1.981597900390625, 2.0445709228515625, 2.1075439453125, 2.1705169677734375, 2.233489990234375, 2.2964630126953125, 2.35943603515625, 2.4224090576171875, 2.485382080078125, 2.5483551025390625, 2.611328125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 12.0, 26.0, 74.0, 178.0, 595.0, 3535.0, 180510.0, 3987668.0, 19509.0, 1584.0, 343.0, 114.0, 49.0, 29.0, 14.0, 9.0, 11.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.55352783203125, -5.2125244140625, -4.87152099609375, -4.530517578125, -4.18951416015625, -3.8485107421875, -3.50750732421875, -3.16650390625, -2.82550048828125, -2.4844970703125, -2.14349365234375, -1.802490234375, -1.46148681640625, -1.1204833984375, -0.77947998046875, -0.4384765625, -0.09747314453125, 0.2435302734375, 0.58453369140625, 0.925537109375, 1.26654052734375, 1.6075439453125, 1.94854736328125, 2.28955078125, 2.63055419921875, 2.9715576171875, 3.31256103515625, 3.653564453125, 3.99456787109375, 4.3355712890625, 4.67657470703125, 5.017578125, 5.35858154296875, 5.6995849609375, 6.04058837890625, 6.381591796875, 6.72259521484375, 7.0635986328125, 7.40460205078125, 7.74560546875, 8.08660888671875, 8.4276123046875, 8.76861572265625, 9.109619140625, 9.45062255859375, 9.7916259765625, 10.13262939453125, 10.4736328125, 10.81463623046875, 11.1556396484375, 11.49664306640625, 11.837646484375, 12.17864990234375, 12.5196533203125, 12.86065673828125, 13.20166015625, 13.54266357421875, 13.8836669921875, 14.22467041015625, 14.565673828125, 14.90667724609375, 15.2476806640625, 15.58868408203125, 15.9296875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 11.0, 23.0, 35.0, 47.0, 73.0, 115.0, 226.0, 355.0, 534.0, 745.0, 655.0, 480.0, 280.0, 192.0, 100.0, 64.0, 40.0, 29.0, 12.0, 12.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.7763671875, -1.7358932495117188, -1.6954193115234375, -1.6549453735351562, -1.614471435546875, -1.5739974975585938, -1.5335235595703125, -1.4930496215820312, -1.45257568359375, -1.4121017456054688, -1.3716278076171875, -1.3311538696289062, -1.290679931640625, -1.2502059936523438, -1.2097320556640625, -1.1692581176757812, -1.1287841796875, -1.0883102416992188, -1.0478363037109375, -1.0073623657226562, -0.966888427734375, -0.9264144897460938, -0.8859405517578125, -0.8454666137695312, -0.80499267578125, -0.7645187377929688, -0.7240447998046875, -0.6835708618164062, -0.643096923828125, -0.6026229858398438, -0.5621490478515625, -0.5216751098632812, -0.481201171875, -0.44072723388671875, -0.4002532958984375, -0.35977935791015625, -0.319305419921875, -0.27883148193359375, -0.2383575439453125, -0.19788360595703125, -0.15740966796875, -0.11693572998046875, -0.0764617919921875, -0.03598785400390625, 0.004486083984375, 0.04496002197265625, 0.0854339599609375, 0.12590789794921875, 0.1663818359375, 0.20685577392578125, 0.2473297119140625, 0.28780364990234375, 0.328277587890625, 0.36875152587890625, 0.4092254638671875, 0.44969940185546875, 0.49017333984375, 0.5306472778320312, 0.5711212158203125, 0.6115951538085938, 0.652069091796875, 0.6925430297851562, 0.7330169677734375, 0.7734909057617188, 0.81396484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 8.0, 14.0, 14.0, 29.0, 26.0, 36.0, 46.0, 49.0, 63.0, 91.0, 72.0, 75.0, 74.0, 76.0, 73.0, 58.0, 46.0, 42.0, 38.0, 24.0, 14.0, 11.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.992717981338501, -1.8936253786087036, -1.7945326566696167, -1.6954400539398193, -1.5963473320007324, -1.497254729270935, -1.3981621265411377, -1.2990694046020508, -1.1999768018722534, -1.100884199142456, -1.0017914772033691, -0.9026988744735718, -0.8036062121391296, -0.7045135498046875, -0.6054209470748901, -0.506328284740448, -0.40723562240600586, -0.3081429600715637, -0.20905032753944397, -0.10995769500732422, -0.01086503267288208, 0.08822762966156006, 0.18732023239135742, 0.28641289472579956, 0.3855055570602417, 0.48459821939468384, 0.583690881729126, 0.6827834844589233, 0.7818761467933655, 0.8809688091278076, 0.980061411857605, 1.0791540145874023, 1.1782464981079102, 1.2773391008377075, 1.3764318227767944, 1.4755244255065918, 1.5746171474456787, 1.673709750175476, 1.7728023529052734, 1.8718950748443604, 1.9709876775741577, 2.070080280303955, 2.169173002243042, 2.268265724182129, 2.3673582077026367, 2.4664509296417236, 2.5655436515808105, 2.6646361351013184, 2.7637288570404053, 2.862821578979492, 2.9619140625, 3.061006784439087, 3.160099506378174, 3.2591919898986816, 3.3582847118377686, 3.4573774337768555, 3.5564699172973633, 3.65556263923645, 3.754655122756958, 3.853747844696045, 3.952840566635132, 4.051933288574219, 4.151025772094727, 4.250118255615234, 4.3492112159729]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 5.0, 10.0, 5.0, 7.0, 14.0, 16.0, 15.0, 14.0, 12.0, 38.0, 22.0, 26.0, 32.0, 31.0, 38.0, 36.0, 48.0, 43.0, 37.0, 41.0, 36.0, 29.0, 44.0, 39.0, 35.0, 33.0, 30.0, 32.0, 22.0, 32.0, 29.0, 30.0, 14.0, 18.0, 13.0, 12.0, 5.0, 10.0, 12.0, 5.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.9949958324432373, -1.9377926588058472, -1.880589485168457, -1.823386311531067, -1.7661831378936768, -1.7089799642562866, -1.6517767906188965, -1.594573736190796, -1.5373704433441162, -1.480167269706726, -1.422964096069336, -1.3657609224319458, -1.3085577487945557, -1.2513545751571655, -1.1941514015197754, -1.1369483470916748, -1.0797451734542847, -1.0225419998168945, -0.9653388261795044, -0.9081356525421143, -0.8509324789047241, -0.793729305267334, -0.7365261912345886, -0.6793230175971985, -0.6221198439598083, -0.5649166703224182, -0.5077134966850281, -0.4505103528499603, -0.3933071792125702, -0.33610400557518005, -0.2789008617401123, -0.22169768810272217, -0.16449439525604248, -0.10729122906923294, -0.0500880628824234, 0.007115095853805542, 0.06431826949119568, 0.12152144312858582, 0.17872458696365356, 0.2359277606010437, 0.29313093423843384, 0.350334107875824, 0.4075372815132141, 0.46474042534828186, 0.5219435691833496, 0.5791467428207397, 0.6363499164581299, 0.69355309009552, 0.7507562637329102, 0.8079594373703003, 0.8651626110076904, 0.9223657846450806, 0.9795689582824707, 1.0367721319198608, 1.093975305557251, 1.1511783599853516, 1.2083816528320312, 1.2655848264694214, 1.3227880001068115, 1.3799911737442017, 1.4371943473815918, 1.494397521018982, 1.551600694656372, 1.6088037490844727, 1.6660069227218628]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 11.0, 4.0, 14.0, 11.0, 13.0, 29.0, 24.0, 35.0, 36.0, 77.0, 70.0, 129.0, 192.0, 319.0, 607.0, 1120.0, 2195.0, 5134.0, 13797.0, 42934.0, 145486.0, 385062.0, 305963.0, 98251.0, 29254.0, 9798.0, 3933.0, 1768.0, 921.0, 486.0, 278.0, 174.0, 103.0, 87.0, 59.0, 36.0, 40.0, 32.0, 16.0, 7.0, 16.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.455078125, -0.43982696533203125, -0.4245758056640625, -0.40932464599609375, -0.394073486328125, -0.37882232666015625, -0.3635711669921875, -0.34832000732421875, -0.33306884765625, -0.31781768798828125, -0.3025665283203125, -0.28731536865234375, -0.272064208984375, -0.25681304931640625, -0.2415618896484375, -0.22631072998046875, -0.2110595703125, -0.19580841064453125, -0.1805572509765625, -0.16530609130859375, -0.150054931640625, -0.13480377197265625, -0.1195526123046875, -0.10430145263671875, -0.08905029296875, -0.07379913330078125, -0.0585479736328125, -0.04329681396484375, -0.028045654296875, -0.01279449462890625, 0.0024566650390625, 0.01770782470703125, 0.032958984375, 0.04821014404296875, 0.0634613037109375, 0.07871246337890625, 0.093963623046875, 0.10921478271484375, 0.1244659423828125, 0.13971710205078125, 0.15496826171875, 0.17021942138671875, 0.1854705810546875, 0.20072174072265625, 0.215972900390625, 0.23122406005859375, 0.2464752197265625, 0.26172637939453125, 0.2769775390625, 0.29222869873046875, 0.3074798583984375, 0.32273101806640625, 0.337982177734375, 0.35323333740234375, 0.3684844970703125, 0.38373565673828125, 0.39898681640625, 0.41423797607421875, 0.4294891357421875, 0.44474029541015625, 0.459991455078125, 0.47524261474609375, 0.4904937744140625, 0.5057449340820312, 0.52099609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 6.0, 10.0, 9.0, 7.0, 15.0, 16.0, 16.0, 34.0, 22.0, 39.0, 33.0, 32.0, 37.0, 54.0, 44.0, 49.0, 38.0, 46.0, 37.0, 33.0, 52.0, 29.0, 35.0, 31.0, 31.0, 32.0, 25.0, 39.0, 23.0, 22.0, 17.0, 11.0, 9.0, 14.0, 5.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.126953125, -1.0890655517578125, -1.051177978515625, -1.0132904052734375, -0.97540283203125, -0.9375152587890625, -0.899627685546875, -0.8617401123046875, -0.8238525390625, -0.7859649658203125, -0.748077392578125, -0.7101898193359375, -0.67230224609375, -0.6344146728515625, -0.596527099609375, -0.5586395263671875, -0.520751953125, -0.4828643798828125, -0.444976806640625, -0.4070892333984375, -0.36920166015625, -0.3313140869140625, -0.293426513671875, -0.2555389404296875, -0.2176513671875, -0.1797637939453125, -0.141876220703125, -0.1039886474609375, -0.06610107421875, -0.0282135009765625, 0.009674072265625, 0.0475616455078125, 0.08544921875, 0.1233367919921875, 0.161224365234375, 0.1991119384765625, 0.23699951171875, 0.2748870849609375, 0.312774658203125, 0.3506622314453125, 0.3885498046875, 0.4264373779296875, 0.464324951171875, 0.5022125244140625, 0.54010009765625, 0.5779876708984375, 0.615875244140625, 0.6537628173828125, 0.691650390625, 0.7295379638671875, 0.767425537109375, 0.8053131103515625, 0.84320068359375, 0.8810882568359375, 0.918975830078125, 0.9568634033203125, 0.9947509765625, 1.0326385498046875, 1.070526123046875, 1.1084136962890625, 1.14630126953125, 1.1841888427734375, 1.222076416015625, 1.2599639892578125, 1.2978515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 12.0, 17.0, 22.0, 24.0, 40.0, 69.0, 91.0, 153.0, 198.0, 310.0, 418.0, 666.0, 903.0, 1412.0, 2198.0, 3203.0, 4916.0, 7397.0, 11938.0, 17835.0, 28728.0, 45209.0, 70343.0, 106419.0, 147263.0, 166984.0, 143113.0, 101776.0, 67288.0, 43036.0, 27014.0, 17325.0, 11049.0, 7060.0, 4712.0, 3196.0, 2075.0, 1355.0, 868.0, 632.0, 419.0, 273.0, 196.0, 133.0, 79.0, 60.0, 43.0, 26.0, 20.0, 18.0, 11.0, 6.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12618064880371094, -0.12174606323242188, -0.11731147766113281, -0.11287689208984375, -0.10844230651855469, -0.10400772094726562, -0.09957313537597656, -0.0951385498046875, -0.09070396423339844, -0.08626937866210938, -0.08183479309082031, -0.07740020751953125, -0.07296562194824219, -0.06853103637695312, -0.06409645080566406, -0.059661865234375, -0.05522727966308594, -0.050792694091796875, -0.04635810852050781, -0.04192352294921875, -0.03748893737792969, -0.033054351806640625, -0.028619766235351562, -0.0241851806640625, -0.019750595092773438, -0.015316009521484375, -0.010881423950195312, -0.00644683837890625, -0.0020122528076171875, 0.002422332763671875, 0.0068569183349609375, 0.01129150390625, 0.015726089477539062, 0.020160675048828125, 0.024595260620117188, 0.02902984619140625, 0.03346443176269531, 0.037899017333984375, 0.04233360290527344, 0.0467681884765625, 0.05120277404785156, 0.055637359619140625, 0.06007194519042969, 0.06450653076171875, 0.06894111633300781, 0.07337570190429688, 0.07781028747558594, 0.082244873046875, 0.08667945861816406, 0.09111404418945312, 0.09554862976074219, 0.09998321533203125, 0.10441780090332031, 0.10885238647460938, 0.11328697204589844, 0.1177215576171875, 0.12215614318847656, 0.12659072875976562, 0.1310253143310547, 0.13545989990234375, 0.1398944854736328, 0.14432907104492188, 0.14876365661621094, 0.1531982421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 11.0, 5.0, 5.0, 8.0, 11.0, 10.0, 9.0, 10.0, 12.0, 12.0, 23.0, 17.0, 31.0, 26.0, 43.0, 59.0, 43.0, 49.0, 47.0, 57.0, 47.0, 61.0, 47.0, 49.0, 49.0, 36.0, 32.0, 27.0, 25.0, 23.0, 21.0, 18.0, 20.0, 5.0, 12.0, 9.0, 6.0, 6.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.303955078125, -2.22314453125, -2.142333984375, -2.0615234375, -1.980712890625, -1.89990234375, -1.819091796875, -1.73828125, -1.657470703125, -1.57666015625, -1.495849609375, -1.4150390625, -1.334228515625, -1.25341796875, -1.172607421875, -1.091796875, -1.010986328125, -0.93017578125, -0.849365234375, -0.7685546875, -0.687744140625, -0.60693359375, -0.526123046875, -0.4453125, -0.364501953125, -0.28369140625, -0.202880859375, -0.1220703125, -0.041259765625, 0.03955078125, 0.120361328125, 0.201171875, 0.281982421875, 0.36279296875, 0.443603515625, 0.5244140625, 0.605224609375, 0.68603515625, 0.766845703125, 0.84765625, 0.928466796875, 1.00927734375, 1.090087890625, 1.1708984375, 1.251708984375, 1.33251953125, 1.413330078125, 1.494140625, 1.574951171875, 1.65576171875, 1.736572265625, 1.8173828125, 1.898193359375, 1.97900390625, 2.059814453125, 2.140625, 2.221435546875, 2.30224609375, 2.383056640625, 2.4638671875, 2.544677734375, 2.62548828125, 2.706298828125, 2.787109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 0.0, 4.0, 8.0, 7.0, 11.0, 7.0, 15.0, 25.0, 24.0, 37.0, 34.0, 62.0, 87.0, 111.0, 271.0, 471.0, 991.0, 2387.0, 6361.0, 22725.0, 101018.0, 421420.0, 376333.0, 86539.0, 19529.0, 5918.0, 2069.0, 938.0, 480.0, 222.0, 138.0, 91.0, 59.0, 40.0, 30.0, 19.0, 14.0, 17.0, 9.0, 5.0, 7.0, 8.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0611572265625, -0.05918121337890625, -0.0572052001953125, -0.05522918701171875, -0.053253173828125, -0.05127716064453125, -0.0493011474609375, -0.04732513427734375, -0.04534912109375, -0.04337310791015625, -0.0413970947265625, -0.03942108154296875, -0.037445068359375, -0.03546905517578125, -0.0334930419921875, -0.03151702880859375, -0.029541015625, -0.02756500244140625, -0.0255889892578125, -0.02361297607421875, -0.021636962890625, -0.01966094970703125, -0.0176849365234375, -0.01570892333984375, -0.01373291015625, -0.01175689697265625, -0.0097808837890625, -0.00780487060546875, -0.005828857421875, -0.00385284423828125, -0.0018768310546875, 9.918212890625e-05, 0.0020751953125, 0.00405120849609375, 0.0060272216796875, 0.00800323486328125, 0.009979248046875, 0.01195526123046875, 0.0139312744140625, 0.01590728759765625, 0.01788330078125, 0.01985931396484375, 0.0218353271484375, 0.02381134033203125, 0.025787353515625, 0.02776336669921875, 0.0297393798828125, 0.03171539306640625, 0.03369140625, 0.03566741943359375, 0.0376434326171875, 0.03961944580078125, 0.041595458984375, 0.04357147216796875, 0.0455474853515625, 0.04752349853515625, 0.04949951171875, 0.05147552490234375, 0.0534515380859375, 0.05542755126953125, 0.057403564453125, 0.05937957763671875, 0.0613555908203125, 0.06333160400390625, 0.0653076171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 7.0, 21.0, 18.0, 26.0, 31.0, 52.0, 64.0, 71.0, 141.0, 104.0, 132.0, 93.0, 61.0, 52.0, 31.0, 20.0, 26.0, 12.0, 10.0, 13.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.459785461425781e-05, -5.317572504281998e-05, -5.175359547138214e-05, -5.0331465899944305e-05, -4.890933632850647e-05, -4.7487206757068634e-05, -4.60650771856308e-05, -4.464294761419296e-05, -4.322081804275513e-05, -4.179868847131729e-05, -4.0376558899879456e-05, -3.895442932844162e-05, -3.7532299757003784e-05, -3.611017018556595e-05, -3.468804061412811e-05, -3.326591104269028e-05, -3.184378147125244e-05, -3.0421651899814606e-05, -2.899952232837677e-05, -2.7577392756938934e-05, -2.61552631855011e-05, -2.4733133614063263e-05, -2.3311004042625427e-05, -2.188887447118759e-05, -2.0466744899749756e-05, -1.904461532831192e-05, -1.7622485756874084e-05, -1.620035618543625e-05, -1.4778226613998413e-05, -1.3356097042560577e-05, -1.1933967471122742e-05, -1.0511837899684906e-05, -9.08970832824707e-06, -7.667578756809235e-06, -6.245449185371399e-06, -4.823319613933563e-06, -3.4011900424957275e-06, -1.979060471057892e-06, -5.569308996200562e-07, 8.651986718177795e-07, 2.2873282432556152e-06, 3.709457814693451e-06, 5.131587386131287e-06, 6.553716957569122e-06, 7.975846529006958e-06, 9.397976100444794e-06, 1.082010567188263e-05, 1.2242235243320465e-05, 1.36643648147583e-05, 1.5086494386196136e-05, 1.6508623957633972e-05, 1.7930753529071808e-05, 1.9352883100509644e-05, 2.077501267194748e-05, 2.2197142243385315e-05, 2.361927181482315e-05, 2.5041401386260986e-05, 2.6463530957698822e-05, 2.7885660529136658e-05, 2.9307790100574493e-05, 3.072991967201233e-05, 3.2152049243450165e-05, 3.3574178814888e-05, 3.4996308386325836e-05, 3.641843795776367e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 11.0, 11.0, 26.0, 32.0, 51.0, 79.0, 142.0, 253.0, 452.0, 912.0, 1998.0, 4996.0, 14232.0, 52652.0, 231600.0, 514506.0, 168309.0, 39279.0, 11492.0, 4039.0, 1721.0, 784.0, 422.0, 213.0, 120.0, 72.0, 50.0, 28.0, 19.0, 7.0, 13.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.075927734375, -0.0736541748046875, -0.071380615234375, -0.0691070556640625, -0.06683349609375, -0.0645599365234375, -0.062286376953125, -0.0600128173828125, -0.0577392578125, -0.0554656982421875, -0.053192138671875, -0.0509185791015625, -0.04864501953125, -0.0463714599609375, -0.044097900390625, -0.0418243408203125, -0.03955078125, -0.0372772216796875, -0.035003662109375, -0.0327301025390625, -0.03045654296875, -0.0281829833984375, -0.025909423828125, -0.0236358642578125, -0.0213623046875, -0.0190887451171875, -0.016815185546875, -0.0145416259765625, -0.01226806640625, -0.0099945068359375, -0.007720947265625, -0.0054473876953125, -0.003173828125, -0.0009002685546875, 0.001373291015625, 0.0036468505859375, 0.00592041015625, 0.0081939697265625, 0.010467529296875, 0.0127410888671875, 0.0150146484375, 0.0172882080078125, 0.019561767578125, 0.0218353271484375, 0.02410888671875, 0.0263824462890625, 0.028656005859375, 0.0309295654296875, 0.033203125, 0.0354766845703125, 0.037750244140625, 0.0400238037109375, 0.04229736328125, 0.0445709228515625, 0.046844482421875, 0.0491180419921875, 0.0513916015625, 0.0536651611328125, 0.055938720703125, 0.0582122802734375, 0.06048583984375, 0.0627593994140625, 0.065032958984375, 0.0673065185546875, 0.069580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 12.0, 14.0, 18.0, 20.0, 47.0, 35.0, 43.0, 53.0, 77.0, 100.0, 94.0, 93.0, 103.0, 66.0, 52.0, 43.0, 34.0, 19.0, 15.0, 3.0, 9.0, 13.0, 4.0, 1.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01702880859375, -0.01648569107055664, -0.01594257354736328, -0.015399456024169922, -0.014856338500976562, -0.014313220977783203, -0.013770103454589844, -0.013226985931396484, -0.012683868408203125, -0.012140750885009766, -0.011597633361816406, -0.011054515838623047, -0.010511398315429688, -0.009968280792236328, -0.009425163269042969, -0.00888204574584961, -0.00833892822265625, -0.007795810699462891, -0.007252693176269531, -0.006709575653076172, -0.0061664581298828125, -0.005623340606689453, -0.005080223083496094, -0.004537105560302734, -0.003993988037109375, -0.0034508705139160156, -0.0029077529907226562, -0.002364635467529297, -0.0018215179443359375, -0.0012784004211425781, -0.0007352828979492188, -0.00019216537475585938, 0.0003509521484375, 0.0008940696716308594, 0.0014371871948242188, 0.001980304718017578, 0.0025234222412109375, 0.003066539764404297, 0.0036096572875976562, 0.004152774810791016, 0.004695892333984375, 0.005239009857177734, 0.005782127380371094, 0.006325244903564453, 0.0068683624267578125, 0.007411479949951172, 0.007954597473144531, 0.00849771499633789, 0.00904083251953125, 0.00958395004272461, 0.010127067565917969, 0.010670185089111328, 0.011213302612304688, 0.011756420135498047, 0.012299537658691406, 0.012842655181884766, 0.013385772705078125, 0.013928890228271484, 0.014472007751464844, 0.015015125274658203, 0.015558242797851562, 0.016101360321044922, 0.01664447784423828, 0.01718759536743164, 0.017730712890625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 15.0, 17.0, 35.0, 40.0, 53.0, 69.0, 86.0, 100.0, 103.0, 80.0, 79.0, 81.0, 72.0, 47.0, 41.0, 25.0, 21.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.608171820640564, -1.5410289764404297, -1.4738860130310059, -1.406743049621582, -1.3396002054214478, -1.2724573612213135, -1.2053143978118896, -1.1381714344024658, -1.0710285902023315, -1.0038857460021973, -0.9367427825927734, -0.8695998787879944, -0.8024569749832153, -0.7353140711784363, -0.6681711673736572, -0.6010282635688782, -0.5338853597640991, -0.46674245595932007, -0.399599552154541, -0.33245664834976196, -0.2653137445449829, -0.19817084074020386, -0.1310279369354248, -0.06388503313064575, 0.0032578706741333008, 0.07040077447891235, 0.1375436782836914, 0.20468658208847046, 0.2718294858932495, 0.33897238969802856, 0.4061152935028076, 0.47325819730758667, 0.5404009819030762, 0.6075438857078552, 0.6746867895126343, 0.7418296933174133, 0.8089725971221924, 0.8761155009269714, 0.9432584047317505, 1.0104012489318848, 1.0775442123413086, 1.1446871757507324, 1.2118300199508667, 1.278972864151001, 1.3461158275604248, 1.4132587909698486, 1.480401635169983, 1.5475444793701172, 1.614687442779541, 1.6818304061889648, 1.7489732503890991, 1.8161160945892334, 1.8832590579986572, 1.950402021408081, 2.017544746398926, 2.0846877098083496, 2.1518306732177734, 2.2189736366271973, 2.286116600036621, 2.353259325027466, 2.4204022884368896, 2.4875452518463135, 2.554687976837158, 2.621830940246582, 2.688973903656006]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 4.0, 9.0, 7.0, 11.0, 22.0, 15.0, 17.0, 20.0, 31.0, 25.0, 36.0, 33.0, 47.0, 42.0, 53.0, 43.0, 43.0, 42.0, 35.0, 40.0, 47.0, 29.0, 42.0, 34.0, 35.0, 29.0, 30.0, 33.0, 20.0, 15.0, 18.0, 16.0, 5.0, 9.0, 12.0, 11.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0681788921356201, -1.0322232246398926, -0.9962676763534546, -0.9603120684623718, -0.9243564605712891, -0.8884008526802063, -0.8524452447891235, -0.8164896368980408, -0.780534029006958, -0.7445784211158752, -0.7086228132247925, -0.6726672053337097, -0.636711597442627, -0.6007559895515442, -0.5648003816604614, -0.5288447737693787, -0.4928891658782959, -0.45693355798721313, -0.42097795009613037, -0.3850223422050476, -0.34906673431396484, -0.3131111264228821, -0.2771555185317993, -0.24119991064071655, -0.2052443027496338, -0.16928869485855103, -0.13333308696746826, -0.0973774790763855, -0.061421871185302734, -0.02546626329421997, 0.010489344596862793, 0.04644495248794556, 0.08240056037902832, 0.11835616827011108, 0.15431177616119385, 0.1902673840522766, 0.22622299194335938, 0.26217859983444214, 0.2981342077255249, 0.33408981561660767, 0.37004542350769043, 0.4060010313987732, 0.44195663928985596, 0.4779122471809387, 0.5138678550720215, 0.5498234629631042, 0.585779070854187, 0.6217346787452698, 0.6576902866363525, 0.6936458945274353, 0.7296015024185181, 0.7655571103096008, 0.8015127182006836, 0.8374683260917664, 0.8734239339828491, 0.9093795418739319, 0.9453351497650146, 0.9812907576560974, 1.0172463655471802, 1.0532019138336182, 1.0891575813293457, 1.1251132488250732, 1.1610687971115112, 1.1970243453979492, 1.2329800128936768]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 8.0, 11.0, 21.0, 24.0, 27.0, 47.0, 69.0, 101.0, 134.0, 207.0, 400.0, 740.0, 1560.0, 3467.0, 8234.0, 21163.0, 56840.0, 153402.0, 360391.0, 275089.0, 102906.0, 38251.0, 14514.0, 5782.0, 2494.0, 1203.0, 578.0, 306.0, 188.0, 123.0, 87.0, 59.0, 34.0, 32.0, 19.0, 13.0, 7.0, 10.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.48370361328125, -1.4283447265625, -1.37298583984375, -1.317626953125, -1.26226806640625, -1.2069091796875, -1.15155029296875, -1.09619140625, -1.04083251953125, -0.9854736328125, -0.93011474609375, -0.874755859375, -0.81939697265625, -0.7640380859375, -0.70867919921875, -0.6533203125, -0.59796142578125, -0.5426025390625, -0.48724365234375, -0.431884765625, -0.37652587890625, -0.3211669921875, -0.26580810546875, -0.21044921875, -0.15509033203125, -0.0997314453125, -0.04437255859375, 0.010986328125, 0.06634521484375, 0.1217041015625, 0.17706298828125, 0.232421875, 0.28778076171875, 0.3431396484375, 0.39849853515625, 0.453857421875, 0.50921630859375, 0.5645751953125, 0.61993408203125, 0.67529296875, 0.73065185546875, 0.7860107421875, 0.84136962890625, 0.896728515625, 0.95208740234375, 1.0074462890625, 1.06280517578125, 1.1181640625, 1.17352294921875, 1.2288818359375, 1.28424072265625, 1.339599609375, 1.39495849609375, 1.4503173828125, 1.50567626953125, 1.56103515625, 1.61639404296875, 1.6717529296875, 1.72711181640625, 1.782470703125, 1.83782958984375, 1.8931884765625, 1.94854736328125, 2.00390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 10.0, 13.0, 10.0, 9.0, 19.0, 17.0, 19.0, 26.0, 35.0, 41.0, 42.0, 52.0, 39.0, 53.0, 56.0, 57.0, 50.0, 42.0, 51.0, 42.0, 42.0, 35.0, 41.0, 25.0, 24.0, 26.0, 23.0, 15.0, 22.0, 7.0, 13.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19921875, -2.11737060546875, -2.0355224609375, -1.95367431640625, -1.871826171875, -1.78997802734375, -1.7081298828125, -1.62628173828125, -1.54443359375, -1.46258544921875, -1.3807373046875, -1.29888916015625, -1.217041015625, -1.13519287109375, -1.0533447265625, -0.97149658203125, -0.8896484375, -0.80780029296875, -0.7259521484375, -0.64410400390625, -0.562255859375, -0.48040771484375, -0.3985595703125, -0.31671142578125, -0.23486328125, -0.15301513671875, -0.0711669921875, 0.01068115234375, 0.092529296875, 0.17437744140625, 0.2562255859375, 0.33807373046875, 0.419921875, 0.50177001953125, 0.5836181640625, 0.66546630859375, 0.747314453125, 0.82916259765625, 0.9110107421875, 0.99285888671875, 1.07470703125, 1.15655517578125, 1.2384033203125, 1.32025146484375, 1.402099609375, 1.48394775390625, 1.5657958984375, 1.64764404296875, 1.7294921875, 1.81134033203125, 1.8931884765625, 1.97503662109375, 2.056884765625, 2.13873291015625, 2.2205810546875, 2.30242919921875, 2.38427734375, 2.46612548828125, 2.5479736328125, 2.62982177734375, 2.711669921875, 2.79351806640625, 2.8753662109375, 2.95721435546875, 3.0390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 11.0, 12.0, 17.0, 23.0, 29.0, 34.0, 56.0, 91.0, 129.0, 169.0, 198.0, 350.0, 695.0, 2087.0, 9873.0, 65462.0, 448964.0, 443468.0, 63445.0, 9697.0, 1999.0, 663.0, 361.0, 225.0, 123.0, 85.0, 87.0, 50.0, 43.0, 23.0, 25.0, 15.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0], "bins": [-4.07421875, -3.9697265625, -3.865234375, -3.7607421875, -3.65625, -3.5517578125, -3.447265625, -3.3427734375, -3.23828125, -3.1337890625, -3.029296875, -2.9248046875, -2.8203125, -2.7158203125, -2.611328125, -2.5068359375, -2.40234375, -2.2978515625, -2.193359375, -2.0888671875, -1.984375, -1.8798828125, -1.775390625, -1.6708984375, -1.56640625, -1.4619140625, -1.357421875, -1.2529296875, -1.1484375, -1.0439453125, -0.939453125, -0.8349609375, -0.73046875, -0.6259765625, -0.521484375, -0.4169921875, -0.3125, -0.2080078125, -0.103515625, 0.0009765625, 0.10546875, 0.2099609375, 0.314453125, 0.4189453125, 0.5234375, 0.6279296875, 0.732421875, 0.8369140625, 0.94140625, 1.0458984375, 1.150390625, 1.2548828125, 1.359375, 1.4638671875, 1.568359375, 1.6728515625, 1.77734375, 1.8818359375, 1.986328125, 2.0908203125, 2.1953125, 2.2998046875, 2.404296875, 2.5087890625, 2.61328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 9.0, 7.0, 10.0, 7.0, 16.0, 17.0, 26.0, 24.0, 35.0, 36.0, 37.0, 50.0, 39.0, 62.0, 51.0, 51.0, 57.0, 56.0, 46.0, 44.0, 43.0, 54.0, 37.0, 37.0, 17.0, 24.0, 18.0, 26.0, 13.0, 9.0, 5.0, 5.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.392578125, -3.293212890625, -3.19384765625, -3.094482421875, -2.9951171875, -2.895751953125, -2.79638671875, -2.697021484375, -2.59765625, -2.498291015625, -2.39892578125, -2.299560546875, -2.2001953125, -2.100830078125, -2.00146484375, -1.902099609375, -1.802734375, -1.703369140625, -1.60400390625, -1.504638671875, -1.4052734375, -1.305908203125, -1.20654296875, -1.107177734375, -1.0078125, -0.908447265625, -0.80908203125, -0.709716796875, -0.6103515625, -0.510986328125, -0.41162109375, -0.312255859375, -0.212890625, -0.113525390625, -0.01416015625, 0.085205078125, 0.1845703125, 0.283935546875, 0.38330078125, 0.482666015625, 0.58203125, 0.681396484375, 0.78076171875, 0.880126953125, 0.9794921875, 1.078857421875, 1.17822265625, 1.277587890625, 1.376953125, 1.476318359375, 1.57568359375, 1.675048828125, 1.7744140625, 1.873779296875, 1.97314453125, 2.072509765625, 2.171875, 2.271240234375, 2.37060546875, 2.469970703125, 2.5693359375, 2.668701171875, 2.76806640625, 2.867431640625, 2.966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 13.0, 19.0, 35.0, 58.0, 99.0, 311.0, 852.0, 3574.0, 31221.0, 592956.0, 393722.0, 21472.0, 2972.0, 719.0, 263.0, 106.0, 56.0, 27.0, 15.0, 14.0, 8.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.548828125, -1.5003204345703125, -1.451812744140625, -1.4033050537109375, -1.35479736328125, -1.3062896728515625, -1.257781982421875, -1.2092742919921875, -1.1607666015625, -1.1122589111328125, -1.063751220703125, -1.0152435302734375, -0.96673583984375, -0.9182281494140625, -0.869720458984375, -0.8212127685546875, -0.772705078125, -0.7241973876953125, -0.675689697265625, -0.6271820068359375, -0.57867431640625, -0.5301666259765625, -0.481658935546875, -0.4331512451171875, -0.3846435546875, -0.3361358642578125, -0.287628173828125, -0.2391204833984375, -0.19061279296875, -0.1421051025390625, -0.093597412109375, -0.0450897216796875, 0.00341796875, 0.0519256591796875, 0.100433349609375, 0.1489410400390625, 0.19744873046875, 0.2459564208984375, 0.294464111328125, 0.3429718017578125, 0.3914794921875, 0.4399871826171875, 0.488494873046875, 0.5370025634765625, 0.58551025390625, 0.6340179443359375, 0.682525634765625, 0.7310333251953125, 0.779541015625, 0.8280487060546875, 0.876556396484375, 0.9250640869140625, 0.97357177734375, 1.0220794677734375, 1.070587158203125, 1.1190948486328125, 1.1676025390625, 1.2161102294921875, 1.264617919921875, 1.3131256103515625, 1.36163330078125, 1.4101409912109375, 1.458648681640625, 1.5071563720703125, 1.5556640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 23.0, 27.0, 55.0, 69.0, 108.0, 162.0, 191.0, 92.0, 71.0, 48.0, 42.0, 29.0, 18.0, 1.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002079010009765625, -0.00020099617540836334, -0.00019409134984016418, -0.00018718652427196503, -0.00018028169870376587, -0.0001733768731355667, -0.00016647204756736755, -0.0001595672219991684, -0.00015266239643096924, -0.00014575757086277008, -0.00013885274529457092, -0.00013194791972637177, -0.0001250430941581726, -0.00011813826858997345, -0.00011123344302177429, -0.00010432861745357513, -9.742379188537598e-05, -9.051896631717682e-05, -8.361414074897766e-05, -7.67093151807785e-05, -6.980448961257935e-05, -6.289966404438019e-05, -5.599483847618103e-05, -4.909001290798187e-05, -4.2185187339782715e-05, -3.528036177158356e-05, -2.83755362033844e-05, -2.1470710635185242e-05, -1.4565885066986084e-05, -7.661059498786926e-06, -7.562339305877686e-07, 6.148591637611389e-06, 1.3053417205810547e-05, 1.9958242774009705e-05, 2.6863068342208862e-05, 3.376789391040802e-05, 4.067271947860718e-05, 4.7577545046806335e-05, 5.448237061500549e-05, 6.138719618320465e-05, 6.829202175140381e-05, 7.519684731960297e-05, 8.210167288780212e-05, 8.900649845600128e-05, 9.591132402420044e-05, 0.0001028161495923996, 0.00010972097516059875, 0.00011662580072879791, 0.00012353062629699707, 0.00013043545186519623, 0.00013734027743339539, 0.00014424510300159454, 0.0001511499285697937, 0.00015805475413799286, 0.00016495957970619202, 0.00017186440527439117, 0.00017876923084259033, 0.0001856740564107895, 0.00019257888197898865, 0.0001994837075471878, 0.00020638853311538696, 0.00021329335868358612, 0.00022019818425178528, 0.00022710300981998444, 0.0002340078353881836]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 19.0, 21.0, 53.0, 84.0, 141.0, 290.0, 516.0, 941.0, 1891.0, 5567.0, 29787.0, 259554.0, 628404.0, 101826.0, 13133.0, 3387.0, 1349.0, 678.0, 354.0, 211.0, 126.0, 67.0, 46.0, 39.0, 13.0, 8.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2373046875, -1.19775390625, -1.158203125, -1.11865234375, -1.0791015625, -1.03955078125, -1.0, -0.96044921875, -0.9208984375, -0.88134765625, -0.841796875, -0.80224609375, -0.7626953125, -0.72314453125, -0.68359375, -0.64404296875, -0.6044921875, -0.56494140625, -0.525390625, -0.48583984375, -0.4462890625, -0.40673828125, -0.3671875, -0.32763671875, -0.2880859375, -0.24853515625, -0.208984375, -0.16943359375, -0.1298828125, -0.09033203125, -0.05078125, -0.01123046875, 0.0283203125, 0.06787109375, 0.107421875, 0.14697265625, 0.1865234375, 0.22607421875, 0.265625, 0.30517578125, 0.3447265625, 0.38427734375, 0.423828125, 0.46337890625, 0.5029296875, 0.54248046875, 0.58203125, 0.62158203125, 0.6611328125, 0.70068359375, 0.740234375, 0.77978515625, 0.8193359375, 0.85888671875, 0.8984375, 0.93798828125, 0.9775390625, 1.01708984375, 1.056640625, 1.09619140625, 1.1357421875, 1.17529296875, 1.21484375, 1.25439453125, 1.2939453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 9.0, 12.0, 10.0, 26.0, 21.0, 30.0, 55.0, 52.0, 58.0, 67.0, 117.0, 107.0, 94.0, 82.0, 68.0, 42.0, 35.0, 37.0, 23.0, 20.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4576530456542969, -0.44289398193359375, -0.4281349182128906, -0.4133758544921875, -0.3986167907714844, -0.38385772705078125, -0.3690986633300781, -0.354339599609375, -0.3395805358886719, -0.32482147216796875, -0.3100624084472656, -0.2953033447265625, -0.2805442810058594, -0.26578521728515625, -0.2510261535644531, -0.23626708984375, -0.22150802612304688, -0.20674896240234375, -0.19198989868164062, -0.1772308349609375, -0.16247177124023438, -0.14771270751953125, -0.13295364379882812, -0.118194580078125, -0.10343551635742188, -0.08867645263671875, -0.07391738891601562, -0.0591583251953125, -0.044399261474609375, -0.02964019775390625, -0.014881134033203125, -0.0001220703125, 0.014636993408203125, 0.02939605712890625, 0.044155120849609375, 0.0589141845703125, 0.07367324829101562, 0.08843231201171875, 0.10319137573242188, 0.117950439453125, 0.13270950317382812, 0.14746856689453125, 0.16222763061523438, 0.1769866943359375, 0.19174575805664062, 0.20650482177734375, 0.22126388549804688, 0.23602294921875, 0.2507820129394531, 0.26554107666015625, 0.2803001403808594, 0.2950592041015625, 0.3098182678222656, 0.32457733154296875, 0.3393363952636719, 0.354095458984375, 0.3688545227050781, 0.38361358642578125, 0.3983726501464844, 0.4131317138671875, 0.4278907775878906, 0.44264984130859375, 0.4574089050292969, 0.47216796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [32.0, 188.0, 444.0, 265.0, 77.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9749128818511963, -1.2551007270812988, -0.5352885723114014, 0.1845235824584961, 0.9043357372283936, 1.624147891998291, 2.3439600467681885, 3.063771963119507, 3.7835843563079834, 4.503396511077881, 5.223208427429199, 5.943020820617676, 6.662833213806152, 7.382645130157471, 8.102457046508789, 8.822269439697266, 9.542081832885742, 10.261894226074219, 10.981706619262695, 11.701518058776855, 12.421330451965332, 13.141142845153809, 13.860954284667969, 14.580766677856445, 15.300579071044922, 16.0203914642334, 16.740203857421875, 17.46001625061035, 18.179828643798828, 18.899639129638672, 19.61945152282715, 20.339263916015625, 21.05907440185547, 21.778886795043945, 22.498699188232422, 23.2185115814209, 23.938323974609375, 24.65813446044922, 25.377946853637695, 26.097759246826172, 26.81757164001465, 27.537384033203125, 28.2571964263916, 28.977008819580078, 29.696819305419922, 30.4166316986084, 31.136444091796875, 31.85625648498535, 32.57606887817383, 33.29587936401367, 34.01569366455078, 34.735504150390625, 35.455318450927734, 36.17512893676758, 36.89494323730469, 37.61475372314453, 38.334564208984375, 39.05437469482422, 39.77418899536133, 40.49399948120117, 41.21381378173828, 41.933624267578125, 42.653438568115234, 43.37324905395508, 44.09306335449219]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 17.0, 20.0, 14.0, 16.0, 23.0, 21.0, 28.0, 25.0, 34.0, 18.0, 33.0, 40.0, 46.0, 33.0, 43.0, 39.0, 45.0, 43.0, 27.0, 37.0, 34.0, 39.0, 43.0, 39.0, 29.0, 19.0, 22.0, 19.0, 22.0, 19.0, 12.0, 10.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0], "bins": [-4.561337471008301, -4.434465408325195, -4.307592868804932, -4.180720806121826, -4.053848743438721, -3.926976442337036, -3.8001041412353516, -3.673232078552246, -3.5463597774505615, -3.419487476348877, -3.2926154136657715, -3.165743112564087, -3.0388708114624023, -2.911998748779297, -2.7851264476776123, -2.6582541465759277, -2.5313820838928223, -2.4045097827911377, -2.2776377201080322, -2.1507654190063477, -2.023893356323242, -1.8970210552215576, -1.770148754119873, -1.643276572227478, -1.516404390335083, -1.389532208442688, -1.262660026550293, -1.1357877254486084, -1.0089155435562134, -0.8820433616638184, -0.7551711201667786, -0.6282988786697388, -0.501427173614502, -0.37455496191978455, -0.24768275022506714, -0.12081053853034973, 0.006061673164367676, 0.1329338550567627, 0.2598060965538025, 0.3866783380508423, 0.5135505199432373, 0.6404227018356323, 0.7672949433326721, 0.8941671848297119, 1.021039366722107, 1.147911548614502, 1.2747838497161865, 1.4016560316085815, 1.5285282135009766, 1.6554003953933716, 1.7822725772857666, 1.9091448783874512, 2.0360169410705566, 2.162889242172241, 2.289761543273926, 2.4166336059570312, 2.543505907058716, 2.6703782081604004, 2.797250270843506, 2.9241225719451904, 3.050994873046875, 3.1778669357299805, 3.304739236831665, 3.4316115379333496, 3.558483600616455]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 6.0, 5.0, 8.0, 4.0, 9.0, 9.0, 14.0, 12.0, 15.0, 14.0, 31.0, 39.0, 41.0, 41.0, 88.0, 162.0, 232.0, 444.0, 1052.0, 3105.0, 12324.0, 74043.0, 783381.0, 2741721.0, 512811.0, 51192.0, 8957.0, 2412.0, 974.0, 405.0, 228.0, 145.0, 80.0, 56.0, 50.0, 35.0, 25.0, 18.0, 13.0, 22.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0], "bins": [-3.546875, -3.44671630859375, -3.3465576171875, -3.24639892578125, -3.146240234375, -3.04608154296875, -2.9459228515625, -2.84576416015625, -2.74560546875, -2.64544677734375, -2.5452880859375, -2.44512939453125, -2.344970703125, -2.24481201171875, -2.1446533203125, -2.04449462890625, -1.9443359375, -1.84417724609375, -1.7440185546875, -1.64385986328125, -1.543701171875, -1.44354248046875, -1.3433837890625, -1.24322509765625, -1.14306640625, -1.04290771484375, -0.9427490234375, -0.84259033203125, -0.742431640625, -0.64227294921875, -0.5421142578125, -0.44195556640625, -0.341796875, -0.24163818359375, -0.1414794921875, -0.04132080078125, 0.058837890625, 0.15899658203125, 0.2591552734375, 0.35931396484375, 0.45947265625, 0.55963134765625, 0.6597900390625, 0.75994873046875, 0.860107421875, 0.96026611328125, 1.0604248046875, 1.16058349609375, 1.2607421875, 1.36090087890625, 1.4610595703125, 1.56121826171875, 1.661376953125, 1.76153564453125, 1.8616943359375, 1.96185302734375, 2.06201171875, 2.16217041015625, 2.2623291015625, 2.36248779296875, 2.462646484375, 2.56280517578125, 2.6629638671875, 2.76312255859375, 2.86328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 5.0, 11.0, 9.0, 9.0, 18.0, 16.0, 26.0, 17.0, 23.0, 36.0, 47.0, 42.0, 43.0, 46.0, 45.0, 43.0, 43.0, 58.0, 44.0, 40.0, 39.0, 51.0, 32.0, 43.0, 30.0, 36.0, 19.0, 24.0, 17.0, 12.0, 17.0, 11.0, 11.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3291015625, -1.28369140625, -1.23828125, -1.19287109375, -1.1474609375, -1.10205078125, -1.056640625, -1.01123046875, -0.9658203125, -0.92041015625, -0.875, -0.82958984375, -0.7841796875, -0.73876953125, -0.693359375, -0.64794921875, -0.6025390625, -0.55712890625, -0.51171875, -0.46630859375, -0.4208984375, -0.37548828125, -0.330078125, -0.28466796875, -0.2392578125, -0.19384765625, -0.1484375, -0.10302734375, -0.0576171875, -0.01220703125, 0.033203125, 0.07861328125, 0.1240234375, 0.16943359375, 0.21484375, 0.26025390625, 0.3056640625, 0.35107421875, 0.396484375, 0.44189453125, 0.4873046875, 0.53271484375, 0.578125, 0.62353515625, 0.6689453125, 0.71435546875, 0.759765625, 0.80517578125, 0.8505859375, 0.89599609375, 0.94140625, 0.98681640625, 1.0322265625, 1.07763671875, 1.123046875, 1.16845703125, 1.2138671875, 1.25927734375, 1.3046875, 1.35009765625, 1.3955078125, 1.44091796875, 1.486328125, 1.53173828125, 1.5771484375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 6.0, 25.0, 43.0, 79.0, 162.0, 439.0, 1020.0, 3832.0, 56127.0, 3874996.0, 248223.0, 6838.0, 1478.0, 577.0, 237.0, 81.0, 40.0, 19.0, 11.0, 7.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.8734130859375, -6.649169921875, -6.4249267578125, -6.20068359375, -5.9764404296875, -5.752197265625, -5.5279541015625, -5.3037109375, -5.0794677734375, -4.855224609375, -4.6309814453125, -4.40673828125, -4.1824951171875, -3.958251953125, -3.7340087890625, -3.509765625, -3.2855224609375, -3.061279296875, -2.8370361328125, -2.61279296875, -2.3885498046875, -2.164306640625, -1.9400634765625, -1.7158203125, -1.4915771484375, -1.267333984375, -1.0430908203125, -0.81884765625, -0.5946044921875, -0.370361328125, -0.1461181640625, 0.078125, 0.3023681640625, 0.526611328125, 0.7508544921875, 0.97509765625, 1.1993408203125, 1.423583984375, 1.6478271484375, 1.8720703125, 2.0963134765625, 2.320556640625, 2.5447998046875, 2.76904296875, 2.9932861328125, 3.217529296875, 3.4417724609375, 3.666015625, 3.8902587890625, 4.114501953125, 4.3387451171875, 4.56298828125, 4.7872314453125, 5.011474609375, 5.2357177734375, 5.4599609375, 5.6842041015625, 5.908447265625, 6.1326904296875, 6.35693359375, 6.5811767578125, 6.805419921875, 7.0296630859375, 7.25390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 4.0, 19.0, 16.0, 36.0, 54.0, 100.0, 131.0, 221.0, 363.0, 474.0, 660.0, 606.0, 484.0, 330.0, 194.0, 127.0, 98.0, 46.0, 29.0, 19.0, 18.0, 14.0, 8.0, 3.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.099029541015625, -1.06231689453125, -1.025604248046875, -0.9888916015625, -0.952178955078125, -0.91546630859375, -0.878753662109375, -0.842041015625, -0.805328369140625, -0.76861572265625, -0.731903076171875, -0.6951904296875, -0.658477783203125, -0.62176513671875, -0.585052490234375, -0.54833984375, -0.511627197265625, -0.47491455078125, -0.438201904296875, -0.4014892578125, -0.364776611328125, -0.32806396484375, -0.291351318359375, -0.254638671875, -0.217926025390625, -0.18121337890625, -0.144500732421875, -0.1077880859375, -0.071075439453125, -0.03436279296875, 0.002349853515625, 0.0390625, 0.075775146484375, 0.11248779296875, 0.149200439453125, 0.1859130859375, 0.222625732421875, 0.25933837890625, 0.296051025390625, 0.332763671875, 0.369476318359375, 0.40618896484375, 0.442901611328125, 0.4796142578125, 0.516326904296875, 0.55303955078125, 0.589752197265625, 0.62646484375, 0.663177490234375, 0.69989013671875, 0.736602783203125, 0.7733154296875, 0.810028076171875, 0.84674072265625, 0.883453369140625, 0.920166015625, 0.956878662109375, 0.99359130859375, 1.030303955078125, 1.0670166015625, 1.103729248046875, 1.14044189453125, 1.177154541015625, 1.2138671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 13.0, 14.0, 13.0, 17.0, 15.0, 29.0, 25.0, 35.0, 31.0, 45.0, 44.0, 45.0, 49.0, 55.0, 40.0, 46.0, 57.0, 49.0, 44.0, 45.0, 57.0, 43.0, 27.0, 32.0, 23.0, 25.0, 21.0, 14.0, 6.0, 11.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7463939189910889, -1.6785998344421387, -1.610805869102478, -1.5430117845535278, -1.4752177000045776, -1.407423734664917, -1.3396296501159668, -1.2718355655670166, -1.2040414810180664, -1.1362473964691162, -1.0684534311294556, -1.0006593465805054, -0.9328652620315552, -0.8650712370872498, -0.7972772121429443, -0.7294831275939941, -0.6616891622543335, -0.5938951373100281, -0.5261010527610779, -0.45830702781677246, -0.39051297307014465, -0.32271891832351685, -0.2549248933792114, -0.18713083863258362, -0.11933678388595581, -0.0515427365899086, 0.01625131070613861, 0.08404535055160522, 0.15183940529823303, 0.21963346004486084, 0.28742748498916626, 0.35522153973579407, 0.4230155944824219, 0.4908096492290497, 0.5586037039756775, 0.6263977289199829, 0.6941918134689331, 0.7619858384132385, 0.829779863357544, 0.8975739479064941, 0.9653679728507996, 1.033161997795105, 1.1009560823440552, 1.1687500476837158, 1.236544132232666, 1.3043382167816162, 1.3721323013305664, 1.439926266670227, 1.5077203512191772, 1.5755144357681274, 1.643308401107788, 1.7111024856567383, 1.7788965702056885, 1.8466906547546387, 1.9144846200942993, 1.9822787046432495, 2.05007266998291, 2.1178667545318604, 2.1856608390808105, 2.2534546852111816, 2.321248769760132, 2.389042854309082, 2.4568369388580322, 2.5246310234069824, 2.5924251079559326]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 2.0, 16.0, 4.0, 11.0, 13.0, 12.0, 18.0, 16.0, 19.0, 28.0, 29.0, 35.0, 40.0, 32.0, 42.0, 38.0, 53.0, 32.0, 51.0, 52.0, 41.0, 45.0, 39.0, 36.0, 30.0, 34.0, 29.0, 36.0, 26.0, 21.0, 24.0, 22.0, 11.0, 12.0, 7.0, 9.0, 9.0, 7.0, 3.0, 10.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8354744911193848, -1.7747690677642822, -1.7140636444091797, -1.6533582210540771, -1.5926527976989746, -1.531947374343872, -1.4712419509887695, -1.410536527633667, -1.3498311042785645, -1.289125680923462, -1.2284202575683594, -1.1677148342132568, -1.1070094108581543, -1.0463039875030518, -0.985598623752594, -0.9248932003974915, -0.8641878366470337, -0.8034824132919312, -0.7427769899368286, -0.6820715665817261, -0.6213661432266235, -0.560660719871521, -0.49995535612106323, -0.4392499327659607, -0.37854450941085815, -0.3178390860557556, -0.2571336627006531, -0.19642826914787292, -0.13572284579277039, -0.07501742243766785, -0.014312028884887695, 0.046393394470214844, 0.10709881782531738, 0.16780424118041992, 0.22850964963436127, 0.2892150580883026, 0.34992048144340515, 0.4106259047985077, 0.47133129835128784, 0.5320367217063904, 0.5927421450614929, 0.6534475684165955, 0.714152991771698, 0.7748583555221558, 0.8355637788772583, 0.8962692022323608, 0.9569746255874634, 1.017680048942566, 1.0783854722976685, 1.139090895652771, 1.1997963190078735, 1.260501742362976, 1.3212071657180786, 1.3819125890731812, 1.4426178932189941, 1.5033233165740967, 1.5640287399291992, 1.6247341632843018, 1.6854395866394043, 1.7461450099945068, 1.8068504333496094, 1.867555856704712, 1.9282612800598145, 1.988966703414917, 2.0496721267700195]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 8.0, 18.0, 12.0, 16.0, 31.0, 40.0, 40.0, 49.0, 80.0, 96.0, 116.0, 173.0, 258.0, 356.0, 671.0, 1532.0, 5076.0, 24704.0, 151521.0, 532366.0, 272644.0, 45690.0, 8434.0, 2223.0, 842.0, 445.0, 296.0, 200.0, 147.0, 96.0, 94.0, 66.0, 37.0, 46.0, 27.0, 18.0, 11.0, 16.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7099609375, -0.6875457763671875, -0.665130615234375, -0.6427154541015625, -0.62030029296875, -0.5978851318359375, -0.575469970703125, -0.5530548095703125, -0.5306396484375, -0.5082244873046875, -0.485809326171875, -0.4633941650390625, -0.44097900390625, -0.4185638427734375, -0.396148681640625, -0.3737335205078125, -0.351318359375, -0.3289031982421875, -0.306488037109375, -0.2840728759765625, -0.26165771484375, -0.2392425537109375, -0.216827392578125, -0.1944122314453125, -0.1719970703125, -0.1495819091796875, -0.127166748046875, -0.1047515869140625, -0.08233642578125, -0.0599212646484375, -0.037506103515625, -0.0150909423828125, 0.00732421875, 0.0297393798828125, 0.052154541015625, 0.0745697021484375, 0.09698486328125, 0.1194000244140625, 0.141815185546875, 0.1642303466796875, 0.1866455078125, 0.2090606689453125, 0.231475830078125, 0.2538909912109375, 0.27630615234375, 0.2987213134765625, 0.321136474609375, 0.3435516357421875, 0.365966796875, 0.3883819580078125, 0.410797119140625, 0.4332122802734375, 0.45562744140625, 0.4780426025390625, 0.500457763671875, 0.5228729248046875, 0.5452880859375, 0.5677032470703125, 0.590118408203125, 0.6125335693359375, 0.63494873046875, 0.6573638916015625, 0.679779052734375, 0.7021942138671875, 0.724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 10.0, 9.0, 8.0, 8.0, 8.0, 11.0, 18.0, 11.0, 24.0, 24.0, 28.0, 27.0, 33.0, 36.0, 33.0, 34.0, 39.0, 33.0, 51.0, 29.0, 40.0, 37.0, 43.0, 42.0, 37.0, 37.0, 28.0, 35.0, 27.0, 30.0, 22.0, 27.0, 15.0, 16.0, 17.0, 15.0, 5.0, 6.0, 10.0, 12.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.189453125, -1.1529083251953125, -1.116363525390625, -1.0798187255859375, -1.04327392578125, -1.0067291259765625, -0.970184326171875, -0.9336395263671875, -0.8970947265625, -0.8605499267578125, -0.824005126953125, -0.7874603271484375, -0.75091552734375, -0.7143707275390625, -0.677825927734375, -0.6412811279296875, -0.604736328125, -0.5681915283203125, -0.531646728515625, -0.4951019287109375, -0.45855712890625, -0.4220123291015625, -0.385467529296875, -0.3489227294921875, -0.3123779296875, -0.2758331298828125, -0.239288330078125, -0.2027435302734375, -0.16619873046875, -0.1296539306640625, -0.093109130859375, -0.0565643310546875, -0.02001953125, 0.0165252685546875, 0.053070068359375, 0.0896148681640625, 0.12615966796875, 0.1627044677734375, 0.199249267578125, 0.2357940673828125, 0.2723388671875, 0.3088836669921875, 0.345428466796875, 0.3819732666015625, 0.41851806640625, 0.4550628662109375, 0.491607666015625, 0.5281524658203125, 0.564697265625, 0.6012420654296875, 0.637786865234375, 0.6743316650390625, 0.71087646484375, 0.7474212646484375, 0.783966064453125, 0.8205108642578125, 0.8570556640625, 0.8936004638671875, 0.930145263671875, 0.9666900634765625, 1.00323486328125, 1.0397796630859375, 1.076324462890625, 1.1128692626953125, 1.1494140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 15.0, 16.0, 24.0, 30.0, 48.0, 74.0, 104.0, 160.0, 264.0, 417.0, 626.0, 924.0, 1522.0, 2458.0, 4009.0, 6354.0, 10138.0, 16767.0, 27884.0, 46265.0, 76014.0, 117751.0, 160462.0, 173274.0, 144591.0, 99211.0, 62356.0, 37745.0, 22874.0, 13783.0, 8311.0, 5141.0, 3243.0, 2059.0, 1314.0, 800.0, 555.0, 328.0, 201.0, 134.0, 104.0, 67.0, 38.0, 35.0, 16.0, 17.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1829833984375, -0.17713546752929688, -0.17128753662109375, -0.16543960571289062, -0.1595916748046875, -0.15374374389648438, -0.14789581298828125, -0.14204788208007812, -0.136199951171875, -0.13035202026367188, -0.12450408935546875, -0.11865615844726562, -0.1128082275390625, -0.10696029663085938, -0.10111236572265625, -0.09526443481445312, -0.08941650390625, -0.08356857299804688, -0.07772064208984375, -0.07187271118164062, -0.0660247802734375, -0.060176849365234375, -0.05432891845703125, -0.048480987548828125, -0.042633056640625, -0.036785125732421875, -0.03093719482421875, -0.025089263916015625, -0.0192413330078125, -0.013393402099609375, -0.00754547119140625, -0.001697540283203125, 0.004150390625, 0.009998321533203125, 0.01584625244140625, 0.021694183349609375, 0.0275421142578125, 0.033390045166015625, 0.03923797607421875, 0.045085906982421875, 0.050933837890625, 0.056781768798828125, 0.06262969970703125, 0.06847763061523438, 0.0743255615234375, 0.08017349243164062, 0.08602142333984375, 0.09186935424804688, 0.09771728515625, 0.10356521606445312, 0.10941314697265625, 0.11526107788085938, 0.1211090087890625, 0.12695693969726562, 0.13280487060546875, 0.13865280151367188, 0.144500732421875, 0.15034866333007812, 0.15619659423828125, 0.16204452514648438, 0.1678924560546875, 0.17374038696289062, 0.17958831787109375, 0.18543624877929688, 0.1912841796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 11.0, 9.0, 8.0, 9.0, 13.0, 16.0, 22.0, 30.0, 18.0, 34.0, 26.0, 32.0, 33.0, 44.0, 45.0, 49.0, 47.0, 54.0, 60.0, 42.0, 37.0, 48.0, 35.0, 36.0, 40.0, 25.0, 29.0, 16.0, 14.0, 12.0, 23.0, 17.0, 9.0, 6.0, 7.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.07421875, -2.975982666015625, -2.87774658203125, -2.779510498046875, -2.6812744140625, -2.583038330078125, -2.48480224609375, -2.386566162109375, -2.288330078125, -2.190093994140625, -2.09185791015625, -1.993621826171875, -1.8953857421875, -1.797149658203125, -1.69891357421875, -1.600677490234375, -1.50244140625, -1.404205322265625, -1.30596923828125, -1.207733154296875, -1.1094970703125, -1.011260986328125, -0.91302490234375, -0.814788818359375, -0.716552734375, -0.618316650390625, -0.52008056640625, -0.421844482421875, -0.3236083984375, -0.225372314453125, -0.12713623046875, -0.028900146484375, 0.0693359375, 0.167572021484375, 0.26580810546875, 0.364044189453125, 0.4622802734375, 0.560516357421875, 0.65875244140625, 0.756988525390625, 0.855224609375, 0.953460693359375, 1.05169677734375, 1.149932861328125, 1.2481689453125, 1.346405029296875, 1.44464111328125, 1.542877197265625, 1.64111328125, 1.739349365234375, 1.83758544921875, 1.935821533203125, 2.0340576171875, 2.132293701171875, 2.23052978515625, 2.328765869140625, 2.427001953125, 2.525238037109375, 2.62347412109375, 2.721710205078125, 2.8199462890625, 2.918182373046875, 3.01641845703125, 3.114654541015625, 3.212890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 9.0, 18.0, 23.0, 48.0, 84.0, 119.0, 172.0, 305.0, 497.0, 833.0, 1946.0, 6050.0, 38631.0, 401246.0, 527401.0, 58638.0, 7983.0, 2241.0, 949.0, 532.0, 290.0, 171.0, 131.0, 86.0, 48.0, 27.0, 16.0, 20.0, 9.0, 7.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107421875, -0.10345649719238281, -0.09949111938476562, -0.09552574157714844, -0.09156036376953125, -0.08759498596191406, -0.08362960815429688, -0.07966423034667969, -0.0756988525390625, -0.07173347473144531, -0.06776809692382812, -0.06380271911621094, -0.05983734130859375, -0.05587196350097656, -0.051906585693359375, -0.04794120788574219, -0.043975830078125, -0.04001045227050781, -0.036045074462890625, -0.03207969665527344, -0.02811431884765625, -0.024148941040039062, -0.020183563232421875, -0.016218185424804688, -0.0122528076171875, -0.008287429809570312, -0.004322052001953125, -0.0003566741943359375, 0.00360870361328125, 0.0075740814208984375, 0.011539459228515625, 0.015504837036132812, 0.01947021484375, 0.023435592651367188, 0.027400970458984375, 0.03136634826660156, 0.03533172607421875, 0.03929710388183594, 0.043262481689453125, 0.04722785949707031, 0.0511932373046875, 0.05515861511230469, 0.059123992919921875, 0.06308937072753906, 0.06705474853515625, 0.07102012634277344, 0.07498550415039062, 0.07895088195800781, 0.082916259765625, 0.08688163757324219, 0.09084701538085938, 0.09481239318847656, 0.09877777099609375, 0.10274314880371094, 0.10670852661132812, 0.11067390441894531, 0.1146392822265625, 0.11860466003417969, 0.12257003784179688, 0.12653541564941406, 0.13050079345703125, 0.13446617126464844, 0.13843154907226562, 0.1423969268798828, 0.1463623046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 27.0, 29.0, 71.0, 113.0, 146.0, 166.0, 146.0, 118.0, 76.0, 45.0, 23.0, 14.0, 10.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001043081283569336, -0.00010160915553569794, -9.891018271446228e-05, -9.621120989322662e-05, -9.351223707199097e-05, -9.081326425075531e-05, -8.811429142951965e-05, -8.5415318608284e-05, -8.271634578704834e-05, -8.001737296581268e-05, -7.731840014457703e-05, -7.461942732334137e-05, -7.192045450210571e-05, -6.922148168087006e-05, -6.65225088596344e-05, -6.382353603839874e-05, -6.112456321716309e-05, -5.842559039592743e-05, -5.572661757469177e-05, -5.3027644753456116e-05, -5.032867193222046e-05, -4.76296991109848e-05, -4.4930726289749146e-05, -4.223175346851349e-05, -3.953278064727783e-05, -3.6833807826042175e-05, -3.413483500480652e-05, -3.143586218357086e-05, -2.8736889362335205e-05, -2.603791654109955e-05, -2.333894371986389e-05, -2.0639970898628235e-05, -1.7940998077392578e-05, -1.5242025256156921e-05, -1.2543052434921265e-05, -9.844079613685608e-06, -7.145106792449951e-06, -4.4461339712142944e-06, -1.7471611499786377e-06, 9.51811671257019e-07, 3.6507844924926758e-06, 6.3497573137283325e-06, 9.04873013496399e-06, 1.1747702956199646e-05, 1.4446675777435303e-05, 1.714564859867096e-05, 1.9844621419906616e-05, 2.2543594241142273e-05, 2.524256706237793e-05, 2.7941539883613586e-05, 3.064051270484924e-05, 3.33394855260849e-05, 3.603845834732056e-05, 3.873743116855621e-05, 4.143640398979187e-05, 4.413537681102753e-05, 4.6834349632263184e-05, 4.953332245349884e-05, 5.22322952747345e-05, 5.4931268095970154e-05, 5.763024091720581e-05, 6.032921373844147e-05, 6.302818655967712e-05, 6.572715938091278e-05, 6.842613220214844e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 3.0, 24.0, 25.0, 46.0, 56.0, 105.0, 157.0, 300.0, 494.0, 960.0, 1662.0, 3381.0, 6816.0, 15008.0, 35784.0, 94088.0, 242555.0, 350005.0, 180454.0, 67730.0, 26313.0, 11214.0, 5330.0, 2578.0, 1394.0, 845.0, 457.0, 284.0, 162.0, 103.0, 76.0, 51.0, 27.0, 18.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07366943359375, -0.07152271270751953, -0.06937599182128906, -0.0672292709350586, -0.06508255004882812, -0.06293582916259766, -0.06078910827636719, -0.05864238739013672, -0.05649566650390625, -0.05434894561767578, -0.05220222473144531, -0.050055503845214844, -0.047908782958984375, -0.045762062072753906, -0.04361534118652344, -0.04146862030029297, -0.0393218994140625, -0.03717517852783203, -0.03502845764160156, -0.032881736755371094, -0.030735015869140625, -0.028588294982910156, -0.026441574096679688, -0.02429485321044922, -0.02214813232421875, -0.02000141143798828, -0.017854690551757812, -0.015707969665527344, -0.013561248779296875, -0.011414527893066406, -0.009267807006835938, -0.007121086120605469, -0.004974365234375, -0.0028276443481445312, -0.0006809234619140625, 0.0014657974243164062, 0.003612518310546875, 0.005759239196777344, 0.007905960083007812, 0.010052680969238281, 0.01219940185546875, 0.014346122741699219, 0.016492843627929688, 0.018639564514160156, 0.020786285400390625, 0.022933006286621094, 0.025079727172851562, 0.02722644805908203, 0.0293731689453125, 0.03151988983154297, 0.03366661071777344, 0.035813331604003906, 0.037960052490234375, 0.040106773376464844, 0.04225349426269531, 0.04440021514892578, 0.04654693603515625, 0.04869365692138672, 0.05084037780761719, 0.052987098693847656, 0.055133819580078125, 0.057280540466308594, 0.05942726135253906, 0.06157398223876953, 0.063720703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 11.0, 11.0, 19.0, 18.0, 21.0, 36.0, 45.0, 50.0, 67.0, 76.0, 106.0, 98.0, 86.0, 97.0, 65.0, 40.0, 24.0, 13.0, 23.0, 11.0, 10.0, 4.0, 11.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027587890625, -0.02662515640258789, -0.02566242218017578, -0.024699687957763672, -0.023736953735351562, -0.022774219512939453, -0.021811485290527344, -0.020848751068115234, -0.019886016845703125, -0.018923282623291016, -0.017960548400878906, -0.016997814178466797, -0.016035079956054688, -0.015072345733642578, -0.014109611511230469, -0.01314687728881836, -0.01218414306640625, -0.01122140884399414, -0.010258674621582031, -0.009295940399169922, -0.008333206176757812, -0.007370471954345703, -0.006407737731933594, -0.005445003509521484, -0.004482269287109375, -0.0035195350646972656, -0.0025568008422851562, -0.0015940666198730469, -0.0006313323974609375, 0.0003314018249511719, 0.0012941360473632812, 0.0022568702697753906, 0.0032196044921875, 0.004182338714599609, 0.005145072937011719, 0.006107807159423828, 0.0070705413818359375, 0.008033275604248047, 0.008996009826660156, 0.009958744049072266, 0.010921478271484375, 0.011884212493896484, 0.012846946716308594, 0.013809680938720703, 0.014772415161132812, 0.015735149383544922, 0.01669788360595703, 0.01766061782836914, 0.01862335205078125, 0.01958608627319336, 0.02054882049560547, 0.021511554718017578, 0.022474288940429688, 0.023437023162841797, 0.024399757385253906, 0.025362491607666016, 0.026325225830078125, 0.027287960052490234, 0.028250694274902344, 0.029213428497314453, 0.030176162719726562, 0.031138896942138672, 0.03210163116455078, 0.03306436538696289, 0.034027099609375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 14.0, 19.0, 20.0, 26.0, 40.0, 34.0, 51.0, 52.0, 48.0, 56.0, 55.0, 69.0, 56.0, 64.0, 65.0, 39.0, 48.0, 60.0, 48.0, 34.0, 27.0, 16.0, 14.0, 9.0, 15.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0538415908813477, -1.0038965940475464, -0.9539515972137451, -0.9040066003799438, -0.8540616035461426, -0.8041166067123413, -0.7541716694831848, -0.7042266726493835, -0.6542816758155823, -0.604336678981781, -0.5543916821479797, -0.5044467449188232, -0.4545017182826996, -0.4045567214488983, -0.35461175441741943, -0.30466675758361816, -0.2547217607498169, -0.20477676391601562, -0.15483178198337555, -0.10488680005073547, -0.054941803216934204, -0.004996806383132935, 0.04494816064834595, 0.09489315748214722, 0.1448381543159485, 0.19478315114974976, 0.24472813308238983, 0.2946731150150299, 0.3446181118488312, 0.39456310868263245, 0.44450807571411133, 0.4944530725479126, 0.5443980693817139, 0.5943430662155151, 0.6442880630493164, 0.6942330598831177, 0.744178056716919, 0.7941230535507202, 0.8440679907798767, 0.894012987613678, 0.9439579844474792, 0.9939029812812805, 1.043847918510437, 1.0937929153442383, 1.1437379121780396, 1.1936829090118408, 1.243627905845642, 1.2935729026794434, 1.3435178995132446, 1.393462896347046, 1.4434078931808472, 1.4933528900146484, 1.5432978868484497, 1.593242883682251, 1.6431877613067627, 1.6931328773498535, 1.7430777549743652, 1.7930227518081665, 1.8429677486419678, 1.892912745475769, 1.9428577423095703, 1.9928027391433716, 2.042747735977173, 2.0926926136016846, 2.1426377296447754]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 6.0, 9.0, 11.0, 16.0, 20.0, 15.0, 17.0, 29.0, 28.0, 40.0, 41.0, 44.0, 36.0, 43.0, 50.0, 50.0, 42.0, 59.0, 46.0, 44.0, 39.0, 42.0, 27.0, 35.0, 27.0, 32.0, 26.0, 21.0, 17.0, 14.0, 10.0, 14.0, 3.0, 9.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1705529689788818, -1.1307274103164673, -1.0909018516540527, -1.0510761737823486, -1.011250615119934, -0.9714250564575195, -0.931599497795105, -0.8917739391326904, -0.8519483208656311, -0.8121227622032166, -0.7722971439361572, -0.7324715852737427, -0.6926460266113281, -0.6528204083442688, -0.6129948496818542, -0.5731692314147949, -0.5333436727523804, -0.49351808428764343, -0.4536924958229065, -0.41386693716049194, -0.374041348695755, -0.33421576023101807, -0.2943902015686035, -0.2545646131038666, -0.21473902463912964, -0.1749134361743927, -0.13508786261081696, -0.09526228159666061, -0.05543670058250427, -0.015611112117767334, 0.02421446144580841, 0.06404003500938416, 0.1038656234741211, 0.14369121193885803, 0.18351678550243378, 0.22334235906600952, 0.26316794753074646, 0.3029935359954834, 0.34281909465789795, 0.3826446831226349, 0.4224702715873718, 0.46229586005210876, 0.5021214485168457, 0.5419470071792603, 0.5817725658416748, 0.6215981841087341, 0.6614237427711487, 0.701249361038208, 0.7410749197006226, 0.7809004783630371, 0.8207260966300964, 0.860551655292511, 0.9003772735595703, 0.9402028322219849, 0.9800283908843994, 1.019853949546814, 1.0596795082092285, 1.099505066871643, 1.1393306255340576, 1.1791563034057617, 1.2189818620681763, 1.2588074207305908, 1.2986329793930054, 1.33845853805542, 1.378284215927124]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 13.0, 16.0, 29.0, 30.0, 37.0, 83.0, 127.0, 211.0, 350.0, 662.0, 1368.0, 2851.0, 6833.0, 16991.0, 44322.0, 111464.0, 232892.0, 299522.0, 191745.0, 83593.0, 32938.0, 12733.0, 4993.0, 2269.0, 1124.0, 570.0, 322.0, 160.0, 107.0, 69.0, 37.0, 32.0, 22.0, 9.0, 6.0, 3.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4586334228515625, -1.398712158203125, -1.3387908935546875, -1.27886962890625, -1.2189483642578125, -1.159027099609375, -1.0991058349609375, -1.0391845703125, -0.9792633056640625, -0.919342041015625, -0.8594207763671875, -0.79949951171875, -0.7395782470703125, -0.679656982421875, -0.6197357177734375, -0.559814453125, -0.4998931884765625, -0.439971923828125, -0.3800506591796875, -0.32012939453125, -0.2602081298828125, -0.200286865234375, -0.1403656005859375, -0.0804443359375, -0.0205230712890625, 0.039398193359375, 0.0993194580078125, 0.15924072265625, 0.2191619873046875, 0.279083251953125, 0.3390045166015625, 0.39892578125, 0.4588470458984375, 0.518768310546875, 0.5786895751953125, 0.63861083984375, 0.6985321044921875, 0.758453369140625, 0.8183746337890625, 0.8782958984375, 0.9382171630859375, 0.998138427734375, 1.0580596923828125, 1.11798095703125, 1.1779022216796875, 1.237823486328125, 1.2977447509765625, 1.357666015625, 1.4175872802734375, 1.477508544921875, 1.5374298095703125, 1.59735107421875, 1.6572723388671875, 1.717193603515625, 1.7771148681640625, 1.8370361328125, 1.8969573974609375, 1.956878662109375, 2.0167999267578125, 2.07672119140625, 2.1366424560546875, 2.196563720703125, 2.2564849853515625, 2.31640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 4.0, 5.0, 13.0, 10.0, 6.0, 12.0, 14.0, 27.0, 18.0, 21.0, 25.0, 30.0, 33.0, 38.0, 47.0, 51.0, 40.0, 53.0, 46.0, 56.0, 48.0, 50.0, 42.0, 35.0, 39.0, 31.0, 34.0, 23.0, 28.0, 24.0, 21.0, 15.0, 11.0, 12.0, 12.0, 7.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.954132080078125, -1.88677978515625, -1.819427490234375, -1.7520751953125, -1.684722900390625, -1.61737060546875, -1.550018310546875, -1.482666015625, -1.415313720703125, -1.34796142578125, -1.280609130859375, -1.2132568359375, -1.145904541015625, -1.07855224609375, -1.011199951171875, -0.94384765625, -0.876495361328125, -0.80914306640625, -0.741790771484375, -0.6744384765625, -0.607086181640625, -0.53973388671875, -0.472381591796875, -0.405029296875, -0.337677001953125, -0.27032470703125, -0.202972412109375, -0.1356201171875, -0.068267822265625, -0.00091552734375, 0.066436767578125, 0.1337890625, 0.201141357421875, 0.26849365234375, 0.335845947265625, 0.4031982421875, 0.470550537109375, 0.53790283203125, 0.605255126953125, 0.672607421875, 0.739959716796875, 0.80731201171875, 0.874664306640625, 0.9420166015625, 1.009368896484375, 1.07672119140625, 1.144073486328125, 1.21142578125, 1.278778076171875, 1.34613037109375, 1.413482666015625, 1.4808349609375, 1.548187255859375, 1.61553955078125, 1.682891845703125, 1.750244140625, 1.817596435546875, 1.88494873046875, 1.952301025390625, 2.0196533203125, 2.087005615234375, 2.15435791015625, 2.221710205078125, 2.2890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 9.0, 9.0, 10.0, 12.0, 18.0, 29.0, 36.0, 51.0, 84.0, 118.0, 179.0, 310.0, 507.0, 1128.0, 2537.0, 6659.0, 20785.0, 72843.0, 236226.0, 401316.0, 212879.0, 63536.0, 18543.0, 6094.0, 2249.0, 1019.0, 505.0, 291.0, 190.0, 107.0, 91.0, 52.0, 35.0, 23.0, 20.0, 10.0, 12.0, 10.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.3203125, -3.229217529296875, -3.13812255859375, -3.047027587890625, -2.9559326171875, -2.864837646484375, -2.77374267578125, -2.682647705078125, -2.591552734375, -2.500457763671875, -2.40936279296875, -2.318267822265625, -2.2271728515625, -2.136077880859375, -2.04498291015625, -1.953887939453125, -1.86279296875, -1.771697998046875, -1.68060302734375, -1.589508056640625, -1.4984130859375, -1.407318115234375, -1.31622314453125, -1.225128173828125, -1.134033203125, -1.042938232421875, -0.95184326171875, -0.860748291015625, -0.7696533203125, -0.678558349609375, -0.58746337890625, -0.496368408203125, -0.4052734375, -0.314178466796875, -0.22308349609375, -0.131988525390625, -0.0408935546875, 0.050201416015625, 0.14129638671875, 0.232391357421875, 0.323486328125, 0.414581298828125, 0.50567626953125, 0.596771240234375, 0.6878662109375, 0.778961181640625, 0.87005615234375, 0.961151123046875, 1.05224609375, 1.143341064453125, 1.23443603515625, 1.325531005859375, 1.4166259765625, 1.507720947265625, 1.59881591796875, 1.689910888671875, 1.781005859375, 1.872100830078125, 1.96319580078125, 2.054290771484375, 2.1453857421875, 2.236480712890625, 2.32757568359375, 2.418670654296875, 2.509765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 4.0, 8.0, 12.0, 19.0, 17.0, 12.0, 20.0, 24.0, 32.0, 39.0, 30.0, 44.0, 46.0, 41.0, 50.0, 45.0, 61.0, 57.0, 51.0, 48.0, 46.0, 41.0, 37.0, 31.0, 34.0, 30.0, 24.0, 23.0, 11.0, 15.0, 13.0, 8.0, 6.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.501953125, -3.415771484375, -3.32958984375, -3.243408203125, -3.1572265625, -3.071044921875, -2.98486328125, -2.898681640625, -2.8125, -2.726318359375, -2.64013671875, -2.553955078125, -2.4677734375, -2.381591796875, -2.29541015625, -2.209228515625, -2.123046875, -2.036865234375, -1.95068359375, -1.864501953125, -1.7783203125, -1.692138671875, -1.60595703125, -1.519775390625, -1.43359375, -1.347412109375, -1.26123046875, -1.175048828125, -1.0888671875, -1.002685546875, -0.91650390625, -0.830322265625, -0.744140625, -0.657958984375, -0.57177734375, -0.485595703125, -0.3994140625, -0.313232421875, -0.22705078125, -0.140869140625, -0.0546875, 0.031494140625, 0.11767578125, 0.203857421875, 0.2900390625, 0.376220703125, 0.46240234375, 0.548583984375, 0.634765625, 0.720947265625, 0.80712890625, 0.893310546875, 0.9794921875, 1.065673828125, 1.15185546875, 1.238037109375, 1.32421875, 1.410400390625, 1.49658203125, 1.582763671875, 1.6689453125, 1.755126953125, 1.84130859375, 1.927490234375, 2.013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 24.0, 33.0, 40.0, 70.0, 96.0, 148.0, 296.0, 505.0, 1060.0, 2058.0, 4414.0, 9824.0, 23326.0, 57746.0, 134562.0, 254328.0, 308236.0, 144153.0, 62520.0, 25400.0, 10394.0, 4614.0, 2225.0, 1099.0, 573.0, 320.0, 195.0, 95.0, 70.0, 29.0, 24.0, 15.0, 15.0, 5.0, 8.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.43988037109375, -0.4241943359375, -0.40850830078125, -0.392822265625, -0.37713623046875, -0.3614501953125, -0.34576416015625, -0.330078125, -0.31439208984375, -0.2987060546875, -0.28302001953125, -0.267333984375, -0.25164794921875, -0.2359619140625, -0.22027587890625, -0.20458984375, -0.18890380859375, -0.1732177734375, -0.15753173828125, -0.141845703125, -0.12615966796875, -0.1104736328125, -0.09478759765625, -0.0791015625, -0.06341552734375, -0.0477294921875, -0.03204345703125, -0.016357421875, -0.00067138671875, 0.0150146484375, 0.03070068359375, 0.04638671875, 0.06207275390625, 0.0777587890625, 0.09344482421875, 0.109130859375, 0.12481689453125, 0.1405029296875, 0.15618896484375, 0.171875, 0.18756103515625, 0.2032470703125, 0.21893310546875, 0.234619140625, 0.25030517578125, 0.2659912109375, 0.28167724609375, 0.29736328125, 0.31304931640625, 0.3287353515625, 0.34442138671875, 0.360107421875, 0.37579345703125, 0.3914794921875, 0.40716552734375, 0.4228515625, 0.43853759765625, 0.4542236328125, 0.46990966796875, 0.485595703125, 0.50128173828125, 0.5169677734375, 0.53265380859375, 0.54833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 7.0, 15.0, 15.0, 21.0, 28.0, 38.0, 45.0, 68.0, 73.0, 86.0, 165.0, 88.0, 70.0, 59.0, 47.0, 46.0, 24.0, 24.0, 14.0, 22.0, 4.0, 6.0, 4.0, 5.0, 3.0, 7.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001251697540283203, -0.00012028589844703674, -0.00011540204286575317, -0.0001105181872844696, -0.00010563433170318604, -0.00010075047612190247, -9.58666205406189e-05, -9.098276495933533e-05, -8.609890937805176e-05, -8.121505379676819e-05, -7.633119821548462e-05, -7.144734263420105e-05, -6.656348705291748e-05, -6.167963147163391e-05, -5.679577589035034e-05, -5.191192030906677e-05, -4.70280647277832e-05, -4.2144209146499634e-05, -3.7260353565216064e-05, -3.2376497983932495e-05, -2.7492642402648926e-05, -2.2608786821365356e-05, -1.7724931240081787e-05, -1.2841075658798218e-05, -7.957220077514648e-06, -3.073364496231079e-06, 1.8104910850524902e-06, 6.6943466663360596e-06, 1.1578202247619629e-05, 1.6462057828903198e-05, 2.1345913410186768e-05, 2.6229768991470337e-05, 3.1113624572753906e-05, 3.5997480154037476e-05, 4.0881335735321045e-05, 4.5765191316604614e-05, 5.0649046897888184e-05, 5.553290247917175e-05, 6.041675806045532e-05, 6.530061364173889e-05, 7.018446922302246e-05, 7.506832480430603e-05, 7.99521803855896e-05, 8.483603596687317e-05, 8.971989154815674e-05, 9.460374712944031e-05, 9.948760271072388e-05, 0.00010437145829200745, 0.00010925531387329102, 0.00011413916945457458, 0.00011902302503585815, 0.00012390688061714172, 0.0001287907361984253, 0.00013367459177970886, 0.00013855844736099243, 0.000143442302942276, 0.00014832615852355957, 0.00015321001410484314, 0.0001580938696861267, 0.00016297772526741028, 0.00016786158084869385, 0.00017274543642997742, 0.00017762929201126099, 0.00018251314759254456, 0.00018739700317382812]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 14.0, 23.0, 21.0, 32.0, 50.0, 74.0, 96.0, 142.0, 170.0, 298.0, 379.0, 621.0, 944.0, 1706.0, 2872.0, 5673.0, 11516.0, 27643.0, 77680.0, 215071.0, 400278.0, 189710.0, 66895.0, 24356.0, 10221.0, 5088.0, 2717.0, 1488.0, 962.0, 582.0, 380.0, 279.0, 182.0, 106.0, 79.0, 53.0, 41.0, 26.0, 22.0, 17.0, 12.0, 9.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6561203002929688, -0.6330413818359375, -0.6099624633789062, -0.586883544921875, -0.5638046264648438, -0.5407257080078125, -0.5176467895507812, -0.49456787109375, -0.47148895263671875, -0.4484100341796875, -0.42533111572265625, -0.402252197265625, -0.37917327880859375, -0.3560943603515625, -0.33301544189453125, -0.3099365234375, -0.28685760498046875, -0.2637786865234375, -0.24069976806640625, -0.217620849609375, -0.19454193115234375, -0.1714630126953125, -0.14838409423828125, -0.12530517578125, -0.10222625732421875, -0.0791473388671875, -0.05606842041015625, -0.032989501953125, -0.00991058349609375, 0.0131683349609375, 0.03624725341796875, 0.059326171875, 0.08240509033203125, 0.1054840087890625, 0.12856292724609375, 0.151641845703125, 0.17472076416015625, 0.1977996826171875, 0.22087860107421875, 0.24395751953125, 0.26703643798828125, 0.2901153564453125, 0.31319427490234375, 0.336273193359375, 0.35935211181640625, 0.3824310302734375, 0.40550994873046875, 0.4285888671875, 0.45166778564453125, 0.4747467041015625, 0.49782562255859375, 0.520904541015625, 0.5439834594726562, 0.5670623779296875, 0.5901412963867188, 0.61322021484375, 0.6362991333007812, 0.6593780517578125, 0.6824569702148438, 0.705535888671875, 0.7286148071289062, 0.7516937255859375, 0.7747726440429688, 0.7978515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 1.0, 7.0, 9.0, 14.0, 10.0, 10.0, 23.0, 23.0, 24.0, 40.0, 37.0, 72.0, 67.0, 74.0, 149.0, 74.0, 78.0, 56.0, 46.0, 40.0, 36.0, 28.0, 13.0, 10.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43701171875, -0.4227409362792969, -0.40847015380859375, -0.3941993713378906, -0.3799285888671875, -0.3656578063964844, -0.35138702392578125, -0.3371162414550781, -0.322845458984375, -0.3085746765136719, -0.29430389404296875, -0.2800331115722656, -0.2657623291015625, -0.2514915466308594, -0.23722076416015625, -0.22294998168945312, -0.20867919921875, -0.19440841674804688, -0.18013763427734375, -0.16586685180664062, -0.1515960693359375, -0.13732528686523438, -0.12305450439453125, -0.10878372192382812, -0.094512939453125, -0.08024215698242188, -0.06597137451171875, -0.051700592041015625, -0.0374298095703125, -0.023159027099609375, -0.00888824462890625, 0.005382537841796875, 0.0196533203125, 0.033924102783203125, 0.04819488525390625, 0.062465667724609375, 0.0767364501953125, 0.09100723266601562, 0.10527801513671875, 0.11954879760742188, 0.133819580078125, 0.14809036254882812, 0.16236114501953125, 0.17663192749023438, 0.1909027099609375, 0.20517349243164062, 0.21944427490234375, 0.23371505737304688, 0.24798583984375, 0.2622566223144531, 0.27652740478515625, 0.2907981872558594, 0.3050689697265625, 0.3193397521972656, 0.33361053466796875, 0.3478813171386719, 0.362152099609375, 0.3764228820800781, 0.39069366455078125, 0.4049644470214844, 0.4192352294921875, 0.4335060119628906, 0.44777679443359375, 0.4620475769042969, 0.476318359375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 10.0, 32.0, 48.0, 74.0, 97.0, 128.0, 132.0, 129.0, 111.0, 83.0, 64.0, 48.0, 15.0, 13.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0425164699554443, -2.838343620300293, -2.6341707706451416, -2.4299979209899902, -2.225825309753418, -2.0216522216796875, -1.8174796104431152, -1.6133067607879639, -1.4091339111328125, -1.2049610614776611, -1.0007882118225098, -0.796615481376648, -0.5924426317214966, -0.3882697820663452, -0.1840970516204834, 0.02007579803466797, 0.22424864768981934, 0.4284214675426483, 0.6325942873954773, 0.8367670774459839, 1.0409399271011353, 1.2451127767562866, 1.4492855072021484, 1.6534583568572998, 1.8576312065124512, 2.0618040561676025, 2.265976905822754, 2.470149517059326, 2.6743226051330566, 2.878495216369629, 3.0826680660247803, 3.2868409156799316, 3.491013526916504, 3.6951863765716553, 3.8993592262268066, 4.103531837463379, 4.307704925537109, 4.511877536773682, 4.716050148010254, 4.920223236083984, 5.124396324157715, 5.328568935394287, 5.532742023468018, 5.73691463470459, 5.94108772277832, 6.145260334014893, 6.349432945251465, 6.553606033325195, 6.757778644561768, 6.96195125579834, 7.16612434387207, 7.370296955108643, 7.574470043182373, 7.778642654418945, 7.982815742492676, 8.186988830566406, 8.39116096496582, 8.59533405303955, 8.799506187438965, 9.003679275512695, 9.207852363586426, 9.412025451660156, 9.61619758605957, 9.8203706741333, 10.024543762207031]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 9.0, 9.0, 12.0, 14.0, 9.0, 22.0, 16.0, 27.0, 28.0, 27.0, 36.0, 30.0, 41.0, 38.0, 39.0, 47.0, 64.0, 45.0, 59.0, 46.0, 51.0, 43.0, 32.0, 44.0, 28.0, 31.0, 14.0, 26.0, 13.0, 16.0, 12.0, 12.0, 9.0, 11.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.560827255249023, -4.430590629577637, -4.30035400390625, -4.170117378234863, -4.039880752563477, -3.90964412689209, -3.779407501220703, -3.6491708755493164, -3.5189342498779297, -3.388697624206543, -3.2584609985351562, -3.1282243728637695, -2.997987747192383, -2.867751121520996, -2.7375144958496094, -2.6072778701782227, -2.477041006088257, -2.34680438041687, -2.2165677547454834, -2.0863311290740967, -1.95609450340271, -1.8258578777313232, -1.695621132850647, -1.5653845071792603, -1.4351478815078735, -1.3049112558364868, -1.1746746301651, -1.0444378852844238, -0.9142013192176819, -0.7839646935462952, -0.6537280082702637, -0.523491382598877, -0.39325475692749023, -0.2630181312561035, -0.1327814757823944, -0.0025448203086853027, 0.12769180536270142, 0.25792843103408813, 0.38816511631011963, 0.5184017419815063, 0.6486383676528931, 0.7788749933242798, 0.9091116189956665, 1.0393483638763428, 1.1695849895477295, 1.2998216152191162, 1.430058240890503, 1.5602948665618896, 1.6905314922332764, 1.820768117904663, 1.9510047435760498, 2.0812413692474365, 2.2114779949188232, 2.34171462059021, 2.471951484680176, 2.6021881103515625, 2.732424736022949, 2.862661361694336, 2.9928979873657227, 3.1231346130371094, 3.253371238708496, 3.383607864379883, 3.5138444900512695, 3.6440811157226562, 3.774317741394043]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 9.0, 6.0, 9.0, 15.0, 21.0, 19.0, 36.0, 51.0, 70.0, 120.0, 200.0, 292.0, 455.0, 761.0, 1238.0, 2073.0, 3264.0, 5536.0, 9887.0, 1002119.0, 9941.0, 5648.0, 3506.0, 2052.0, 1191.0, 736.0, 459.0, 287.0, 192.0, 113.0, 84.0, 52.0, 34.0, 25.0, 20.0, 13.0, 15.0, 10.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7727837562561035, -3.6491355895996094, -3.5254874229431152, -3.401839256286621, -3.278191328048706, -3.154543161392212, -3.0308949947357178, -2.9072468280792236, -2.7835988998413086, -2.6599507331848145, -2.5363025665283203, -2.412654399871826, -2.289006471633911, -2.165358304977417, -2.041710138320923, -1.9180619716644287, -1.7944138050079346, -1.6707656383514404, -1.5471175909042358, -1.4234694242477417, -1.299821376800537, -1.176173210144043, -1.0525250434875488, -0.9288769364356995, -0.8052288293838501, -0.6815807223320007, -0.5579326152801514, -0.4342844486236572, -0.31063634157180786, -0.1869882345199585, -0.06334006786346436, 0.06030803918838501, 0.18395614624023438, 0.30760425329208374, 0.4312523901462555, 0.5549005270004272, 0.6785486340522766, 0.802196741104126, 0.9258449077606201, 1.0494930744171143, 1.1731411218643188, 1.296789288520813, 1.4204373359680176, 1.5440855026245117, 1.6677336692810059, 1.7913817167282104, 1.9150298833847046, 2.038677930831909, 2.1623260974884033, 2.2859742641448975, 2.4096224308013916, 2.5332703590393066, 2.656918525695801, 2.780566692352295, 2.904214859008789, 3.027863025665283, 3.1515111923217773, 3.2751593589782715, 3.3988075256347656, 3.5224556922912598, 3.646103620529175, 3.769751787185669, 3.893399953842163, 4.017047882080078, 4.140696048736572]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 15.0, 37.0, 68.0, 170.0, 577.0, 1603.0, 10461.0, 249047.0, 51187748.0, 17422.0, 2241.0, 579.0, 246.0, 98.0, 49.0, 34.0, 11.0, 12.0, 3.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -17.95361328125, -17.3134765625, -16.67333984375, -16.033203125, -15.39306640625, -14.7529296875, -14.11279296875, -13.47265625, -12.83251953125, -12.1923828125, -11.55224609375, -10.912109375, -10.27197265625, -9.6318359375, -8.99169921875, -8.3515625, -7.71142578125, -7.0712890625, -6.43115234375, -5.791015625, -5.15087890625, -4.5107421875, -3.87060546875, -3.23046875, -2.59033203125, -1.9501953125, -1.31005859375, -0.669921875, -0.02978515625, 0.6103515625, 1.25048828125, 1.890625, 2.53076171875, 3.1708984375, 3.81103515625, 4.451171875, 5.09130859375, 5.7314453125, 6.37158203125, 7.01171875, 7.65185546875, 8.2919921875, 8.93212890625, 9.572265625, 10.21240234375, 10.8525390625, 11.49267578125, 12.1328125, 12.77294921875, 13.4130859375, 14.05322265625, 14.693359375, 15.33349609375, 15.9736328125, 16.61376953125, 17.25390625, 17.89404296875, 18.5341796875, 19.17431640625, 19.814453125, 20.45458984375, 21.0947265625, 21.73486328125, 22.375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 1.0, 1.0, 11.0, 12.0, 11.0, 31.0, 49.0, 48.0, 91.0, 144.0, 203.0, 348.0, 471.0, 783.0, 1379.0, 2330.0, 3880.0, 6875.0, 12414.0, 22343.0, 40708.0, 76113.0, 138702.0, 239028.0, 375659.0, 528286.0, 3649618.0, 451694.0, 313432.0, 189470.0, 107555.0, 58313.0, 31436.0, 17177.0, 9502.0, 5392.0, 3223.0, 1801.0, 1110.0, 652.0, 393.0, 252.0, 160.0, 107.0, 61.0, 64.0, 41.0, 18.0, 17.0, 9.0, 3.0, 9.0, 2.0, 2.0], "bins": [-1.3916015625, -1.353240966796875, -1.31488037109375, -1.276519775390625, -1.2381591796875, -1.199798583984375, -1.16143798828125, -1.123077392578125, -1.084716796875, -1.046356201171875, -1.00799560546875, -0.969635009765625, -0.9312744140625, -0.892913818359375, -0.85455322265625, -0.816192626953125, -0.77783203125, -0.739471435546875, -0.70111083984375, -0.662750244140625, -0.6243896484375, -0.586029052734375, -0.54766845703125, -0.509307861328125, -0.470947265625, -0.432586669921875, -0.39422607421875, -0.355865478515625, -0.3175048828125, -0.279144287109375, -0.24078369140625, -0.202423095703125, -0.1640625, -0.125701904296875, -0.08734130859375, -0.048980712890625, -0.0106201171875, 0.027740478515625, 0.06610107421875, 0.104461669921875, 0.142822265625, 0.181182861328125, 0.21954345703125, 0.257904052734375, 0.2962646484375, 0.334625244140625, 0.37298583984375, 0.411346435546875, 0.44970703125, 0.488067626953125, 0.52642822265625, 0.564788818359375, 0.6031494140625, 0.641510009765625, 0.67987060546875, 0.718231201171875, 0.756591796875, 0.794952392578125, 0.83331298828125, 0.871673583984375, 0.9100341796875, 0.948394775390625, 0.98675537109375, 1.025115966796875, 1.0634765625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 3.0, 9.0, 8.0, 10.0, 15.0, 13.0, 27.0, 17.0, 27.0, 36.0, 33.0, 44.0, 41.0, 45.0, 57.0, 62.0, 1069.0, 57.0, 51.0, 53.0, 43.0, 44.0, 47.0, 39.0, 33.0, 20.0, 24.0, 21.0, 16.0, 15.0, 6.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-25.90625, -25.231689453125, -24.55712890625, -23.882568359375, -23.2080078125, -22.533447265625, -21.85888671875, -21.184326171875, -20.509765625, -19.835205078125, -19.16064453125, -18.486083984375, -17.8115234375, -17.136962890625, -16.46240234375, -15.787841796875, -15.11328125, -14.438720703125, -13.76416015625, -13.089599609375, -12.4150390625, -11.740478515625, -11.06591796875, -10.391357421875, -9.716796875, -9.042236328125, -8.36767578125, -7.693115234375, -7.0185546875, -6.343994140625, -5.66943359375, -4.994873046875, -4.3203125, -3.645751953125, -2.97119140625, -2.296630859375, -1.6220703125, -0.947509765625, -0.27294921875, 0.401611328125, 1.076171875, 1.750732421875, 2.42529296875, 3.099853515625, 3.7744140625, 4.448974609375, 5.12353515625, 5.798095703125, 6.47265625, 7.147216796875, 7.82177734375, 8.496337890625, 9.1708984375, 9.845458984375, 10.52001953125, 11.194580078125, 11.869140625, 12.543701171875, 13.21826171875, 13.892822265625, 14.5673828125, 15.241943359375, 15.91650390625, 16.591064453125, 17.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 1.0, 7.0, 7.0, 10.0, 9.0, 19.0, 23.0, 50.0, 56.0, 104.0, 135.0, 220.0, 321.0, 489.0, 787.0, 1196.0, 1879.0, 2983.0, 4851.0, 8047.0, 13192.0, 21361.0, 35923.0, 58676.0, 95352.0, 150522.0, 223100.0, 309431.0, 386544.0, 3535032.0, 425368.0, 329570.0, 243953.0, 165967.0, 106690.0, 66348.0, 40233.0, 24408.0, 14533.0, 9013.0, 5527.0, 3371.0, 2131.0, 1340.0, 936.0, 589.0, 395.0, 242.0, 158.0, 101.0, 79.0, 61.0, 42.0, 18.0, 14.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.87548828125, -0.846893310546875, -0.81829833984375, -0.789703369140625, -0.7611083984375, -0.732513427734375, -0.70391845703125, -0.675323486328125, -0.646728515625, -0.618133544921875, -0.58953857421875, -0.560943603515625, -0.5323486328125, -0.503753662109375, -0.47515869140625, -0.446563720703125, -0.41796875, -0.389373779296875, -0.36077880859375, -0.332183837890625, -0.3035888671875, -0.274993896484375, -0.24639892578125, -0.217803955078125, -0.189208984375, -0.160614013671875, -0.13201904296875, -0.103424072265625, -0.0748291015625, -0.046234130859375, -0.01763916015625, 0.010955810546875, 0.03955078125, 0.068145751953125, 0.09674072265625, 0.125335693359375, 0.1539306640625, 0.182525634765625, 0.21112060546875, 0.239715576171875, 0.268310546875, 0.296905517578125, 0.32550048828125, 0.354095458984375, 0.3826904296875, 0.411285400390625, 0.43988037109375, 0.468475341796875, 0.4970703125, 0.525665283203125, 0.55426025390625, 0.582855224609375, 0.6114501953125, 0.640045166015625, 0.66864013671875, 0.697235107421875, 0.725830078125, 0.754425048828125, 0.78302001953125, 0.811614990234375, 0.8402099609375, 0.868804931640625, 0.89739990234375, 0.925994873046875, 0.95458984375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 10.0, 6.0, 13.0, 16.0, 18.0, 25.0, 18.0, 20.0, 34.0, 42.0, 38.0, 36.0, 43.0, 41.0, 39.0, 51.0, 1036.0, 73.0, 45.0, 53.0, 44.0, 37.0, 47.0, 43.0, 37.0, 21.0, 24.0, 26.0, 13.0, 18.0, 12.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.875, -17.327392578125, -16.77978515625, -16.232177734375, -15.6845703125, -15.136962890625, -14.58935546875, -14.041748046875, -13.494140625, -12.946533203125, -12.39892578125, -11.851318359375, -11.3037109375, -10.756103515625, -10.20849609375, -9.660888671875, -9.11328125, -8.565673828125, -8.01806640625, -7.470458984375, -6.9228515625, -6.375244140625, -5.82763671875, -5.280029296875, -4.732421875, -4.184814453125, -3.63720703125, -3.089599609375, -2.5419921875, -1.994384765625, -1.44677734375, -0.899169921875, -0.3515625, 0.196044921875, 0.74365234375, 1.291259765625, 1.8388671875, 2.386474609375, 2.93408203125, 3.481689453125, 4.029296875, 4.576904296875, 5.12451171875, 5.672119140625, 6.2197265625, 6.767333984375, 7.31494140625, 7.862548828125, 8.41015625, 8.957763671875, 9.50537109375, 10.052978515625, 10.6005859375, 11.148193359375, 11.69580078125, 12.243408203125, 12.791015625, 13.338623046875, 13.88623046875, 14.433837890625, 14.9814453125, 15.529052734375, 16.07666015625, 16.624267578125, 17.171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 12.0, 17.0, 17.0, 23.0, 35.0, 41.0, 49.0, 64.0, 101.0, 151.0, 254.0, 418.0, 686.0, 1228.0, 2089.0, 3947.0, 7584.0, 14279.0, 28177.0, 55850.0, 113091.0, 5641262.0, 239639.0, 89440.0, 44455.0, 22851.0, 11958.0, 6082.0, 3157.0, 1795.0, 1066.0, 559.0, 337.0, 220.0, 160.0, 118.0, 62.0, 39.0, 28.0, 24.0, 15.0, 14.0, 8.0, 7.0, 6.0, 4.0, 9.0, 5.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0], "bins": [-3.294921875, -3.191436767578125, -3.08795166015625, -2.984466552734375, -2.8809814453125, -2.777496337890625, -2.67401123046875, -2.570526123046875, -2.467041015625, -2.363555908203125, -2.26007080078125, -2.156585693359375, -2.0531005859375, -1.949615478515625, -1.84613037109375, -1.742645263671875, -1.63916015625, -1.535675048828125, -1.43218994140625, -1.328704833984375, -1.2252197265625, -1.121734619140625, -1.01824951171875, -0.914764404296875, -0.811279296875, -0.707794189453125, -0.60430908203125, -0.500823974609375, -0.3973388671875, -0.293853759765625, -0.19036865234375, -0.086883544921875, 0.0166015625, 0.120086669921875, 0.22357177734375, 0.327056884765625, 0.4305419921875, 0.534027099609375, 0.63751220703125, 0.740997314453125, 0.844482421875, 0.947967529296875, 1.05145263671875, 1.154937744140625, 1.2584228515625, 1.361907958984375, 1.46539306640625, 1.568878173828125, 1.67236328125, 1.775848388671875, 1.87933349609375, 1.982818603515625, 2.0863037109375, 2.189788818359375, 2.29327392578125, 2.396759033203125, 2.500244140625, 2.603729248046875, 2.70721435546875, 2.810699462890625, 2.9141845703125, 3.017669677734375, 3.12115478515625, 3.224639892578125, 3.328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 8.0, 15.0, 11.0, 17.0, 26.0, 24.0, 28.0, 32.0, 36.0, 43.0, 44.0, 39.0, 43.0, 38.0, 83.0, 1037.0, 46.0, 47.0, 41.0, 40.0, 37.0, 33.0, 41.0, 34.0, 26.0, 23.0, 21.0, 19.0, 18.0, 8.0, 10.0, 5.0, 12.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.28125, -15.79248046875, -15.3037109375, -14.81494140625, -14.326171875, -13.83740234375, -13.3486328125, -12.85986328125, -12.37109375, -11.88232421875, -11.3935546875, -10.90478515625, -10.416015625, -9.92724609375, -9.4384765625, -8.94970703125, -8.4609375, -7.97216796875, -7.4833984375, -6.99462890625, -6.505859375, -6.01708984375, -5.5283203125, -5.03955078125, -4.55078125, -4.06201171875, -3.5732421875, -3.08447265625, -2.595703125, -2.10693359375, -1.6181640625, -1.12939453125, -0.640625, -0.15185546875, 0.3369140625, 0.82568359375, 1.314453125, 1.80322265625, 2.2919921875, 2.78076171875, 3.26953125, 3.75830078125, 4.2470703125, 4.73583984375, 5.224609375, 5.71337890625, 6.2021484375, 6.69091796875, 7.1796875, 7.66845703125, 8.1572265625, 8.64599609375, 9.134765625, 9.62353515625, 10.1123046875, 10.60107421875, 11.08984375, 11.57861328125, 12.0673828125, 12.55615234375, 13.044921875, 13.53369140625, 14.0224609375, 14.51123046875, 15.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 19.0, 60.0, 346.0, 436.0, 106.0, 27.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.49773406982422, -61.635929107666016, -59.77412033081055, -57.912315368652344, -56.050506591796875, -54.18870162963867, -52.32689666748047, -50.465087890625, -48.6032829284668, -46.741477966308594, -44.879669189453125, -43.01786422729492, -41.15605926513672, -39.29425048828125, -37.43244552612305, -35.570640563964844, -33.708831787109375, -31.84702491760254, -29.985218048095703, -28.1234130859375, -26.261606216430664, -24.399799346923828, -22.537994384765625, -20.67618751525879, -18.814380645751953, -16.952573776245117, -15.090767860412598, -13.228961944580078, -11.367155075073242, -9.505348205566406, -7.643542289733887, -5.781736373901367, -3.9199295043945312, -2.0581231117248535, -0.19631671905517578, 1.665489673614502, 3.5272960662841797, 5.389102935791016, 7.250908851623535, 9.112714767456055, 10.97452163696289, 12.836328506469727, 14.698134422302246, 16.559940338134766, 18.4217472076416, 20.283554077148438, 22.14535903930664, 24.007165908813477, 25.868972778320312, 27.73077964782715, 29.592586517333984, 31.454391479492188, 33.316200256347656, 35.17800521850586, 37.03981018066406, 38.90161895751953, 40.763423919677734, 42.62522888183594, 44.487037658691406, 46.34884262084961, 48.21064758300781, 50.07245635986328, 51.934261322021484, 53.79606628417969, 55.657875061035156]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 8.0, 7.0, 14.0, 26.0, 18.0, 30.0, 41.0, 47.0, 54.0, 66.0, 71.0, 78.0, 84.0, 69.0, 72.0, 60.0, 36.0, 39.0, 31.0, 22.0, 20.0, 18.0, 11.0, 8.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.118831634521484, -42.92047119140625, -41.72210693359375, -40.52374267578125, -39.325382232666016, -38.12702178955078, -36.92865753173828, -35.73029327392578, -34.53193283081055, -33.33357238769531, -32.13520812988281, -30.936845779418945, -29.738483428955078, -28.54012107849121, -27.341758728027344, -26.143396377563477, -24.94503402709961, -23.746671676635742, -22.548309326171875, -21.349946975708008, -20.15158462524414, -18.953222274780273, -17.754859924316406, -16.55649757385254, -15.358135223388672, -14.159772872924805, -12.961410522460938, -11.76304817199707, -10.564685821533203, -9.366323471069336, -8.167961120605469, -6.969598770141602, -5.771232604980469, -4.572870254516602, -3.3745079040527344, -2.176145553588867, -0.977783203125, 0.2205791473388672, 1.4189414978027344, 2.6173038482666016, 3.8156661987304688, 5.014028549194336, 6.212390899658203, 7.41075325012207, 8.609115600585938, 9.807477951049805, 11.005840301513672, 12.204202651977539, 13.402565002441406, 14.600927352905273, 15.79928970336914, 16.997652053833008, 18.196014404296875, 19.394376754760742, 20.59273910522461, 21.791101455688477, 22.989463806152344, 24.18782615661621, 25.386188507080078, 26.584550857543945, 27.782913208007812, 28.98127555847168, 30.179637908935547, 31.378000259399414, 32.57636260986328]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 10.0, 18.0, 18.0, 27.0, 41.0, 53.0, 50.0, 97.0, 140.0, 231.0, 378.0, 596.0, 1106.0, 1920.0, 4064.0, 10624.0, 39314.0, 3876150.0, 216255.0, 27384.0, 8435.0, 3497.0, 1648.0, 843.0, 494.0, 277.0, 187.0, 128.0, 87.0, 69.0, 30.0, 25.0, 13.0, 17.0, 15.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2767353057861328, -0.2685585021972656, -0.26038169860839844, -0.25220489501953125, -0.24402809143066406, -0.23585128784179688, -0.2276744842529297, -0.2194976806640625, -0.2113208770751953, -0.20314407348632812, -0.19496726989746094, -0.18679046630859375, -0.17861366271972656, -0.17043685913085938, -0.1622600555419922, -0.154083251953125, -0.1459064483642578, -0.13772964477539062, -0.12955284118652344, -0.12137603759765625, -0.11319923400878906, -0.10502243041992188, -0.09684562683105469, -0.0886688232421875, -0.08049201965332031, -0.07231521606445312, -0.06413841247558594, -0.05596160888671875, -0.04778480529785156, -0.039608001708984375, -0.03143119812011719, -0.02325439453125, -0.015077590942382812, -0.006900787353515625, 0.0012760162353515625, 0.00945281982421875, 0.017629623413085938, 0.025806427001953125, 0.03398323059082031, 0.0421600341796875, 0.05033683776855469, 0.058513641357421875, 0.06669044494628906, 0.07486724853515625, 0.08304405212402344, 0.09122085571289062, 0.09939765930175781, 0.107574462890625, 0.11575126647949219, 0.12392807006835938, 0.13210487365722656, 0.14028167724609375, 0.14845848083496094, 0.15663528442382812, 0.1648120880126953, 0.1729888916015625, 0.1811656951904297, 0.18934249877929688, 0.19751930236816406, 0.20569610595703125, 0.21387290954589844, 0.22204971313476562, 0.2302265167236328, 0.2384033203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 10.0, 14.0, 9.0, 13.0, 145.0, 633.0, 13.0, 16.0, 15.0, 6.0, 3.0, 9.0, 6.0, 8.0, 8.0, 4.0, 5.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.126708984375, -0.12277412414550781, -0.11883926391601562, -0.11490440368652344, -0.11096954345703125, -0.10703468322753906, -0.10309982299804688, -0.09916496276855469, -0.0952301025390625, -0.09129524230957031, -0.08736038208007812, -0.08342552185058594, -0.07949066162109375, -0.07555580139160156, -0.07162094116210938, -0.06768608093261719, -0.063751220703125, -0.05981636047363281, -0.055881500244140625, -0.05194664001464844, -0.04801177978515625, -0.04407691955566406, -0.040142059326171875, -0.03620719909667969, -0.0322723388671875, -0.028337478637695312, -0.024402618408203125, -0.020467758178710938, -0.01653289794921875, -0.012598037719726562, -0.008663177490234375, -0.0047283172607421875, -0.00079345703125, 0.0031414031982421875, 0.007076263427734375, 0.011011123657226562, 0.01494598388671875, 0.018880844116210938, 0.022815704345703125, 0.026750564575195312, 0.0306854248046875, 0.03462028503417969, 0.038555145263671875, 0.04249000549316406, 0.04642486572265625, 0.05035972595214844, 0.054294586181640625, 0.05822944641113281, 0.062164306640625, 0.06609916687011719, 0.07003402709960938, 0.07396888732910156, 0.07790374755859375, 0.08183860778808594, 0.08577346801757812, 0.08970832824707031, 0.0936431884765625, 0.09757804870605469, 0.10151290893554688, 0.10544776916503906, 0.10938262939453125, 0.11331748962402344, 0.11725234985351562, 0.12118721008300781, 0.1251220703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 11.0, 11.0, 8.0, 15.0, 31.0, 47.0, 76.0, 104.0, 190.0, 242.0, 519.0, 898.0, 1891.0, 4489.0, 12288.0, 51202.0, 528236.0, 3384147.0, 172474.0, 25364.0, 7039.0, 2568.0, 1187.0, 555.0, 277.0, 140.0, 81.0, 66.0, 38.0, 34.0, 17.0, 13.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.19329452514648438, -0.18749237060546875, -0.18169021606445312, -0.1758880615234375, -0.17008590698242188, -0.16428375244140625, -0.15848159790039062, -0.152679443359375, -0.14687728881835938, -0.14107513427734375, -0.13527297973632812, -0.1294708251953125, -0.12366867065429688, -0.11786651611328125, -0.11206436157226562, -0.10626220703125, -0.10046005249023438, -0.09465789794921875, -0.08885574340820312, -0.0830535888671875, -0.07725143432617188, -0.07144927978515625, -0.06564712524414062, -0.059844970703125, -0.054042816162109375, -0.04824066162109375, -0.042438507080078125, -0.0366363525390625, -0.030834197998046875, -0.02503204345703125, -0.019229888916015625, -0.013427734375, -0.007625579833984375, -0.00182342529296875, 0.003978729248046875, 0.0097808837890625, 0.015583038330078125, 0.02138519287109375, 0.027187347412109375, 0.032989501953125, 0.038791656494140625, 0.04459381103515625, 0.050395965576171875, 0.0561981201171875, 0.062000274658203125, 0.06780242919921875, 0.07360458374023438, 0.07940673828125, 0.08520889282226562, 0.09101104736328125, 0.09681320190429688, 0.1026153564453125, 0.10841751098632812, 0.11421966552734375, 0.12002182006835938, 0.125823974609375, 0.13162612915039062, 0.13742828369140625, 0.14323043823242188, 0.1490325927734375, 0.15483474731445312, 0.16063690185546875, 0.16643905639648438, 0.1722412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 18.0, 21.0, 24.0, 43.0, 56.0, 111.0, 218.0, 511.0, 1617.0, 822.0, 295.0, 125.0, 68.0, 45.0, 22.0, 10.0, 12.0, 12.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1673583984375, -0.16324996948242188, -0.15914154052734375, -0.15503311157226562, -0.1509246826171875, -0.14681625366210938, -0.14270782470703125, -0.13859939575195312, -0.134490966796875, -0.13038253784179688, -0.12627410888671875, -0.12216567993164062, -0.1180572509765625, -0.11394882202148438, -0.10984039306640625, -0.10573196411132812, -0.10162353515625, -0.09751510620117188, -0.09340667724609375, -0.08929824829101562, -0.0851898193359375, -0.08108139038085938, -0.07697296142578125, -0.07286453247070312, -0.068756103515625, -0.06464767456054688, -0.06053924560546875, -0.056430816650390625, -0.0523223876953125, -0.048213958740234375, -0.04410552978515625, -0.039997100830078125, -0.035888671875, -0.031780242919921875, -0.02767181396484375, -0.023563385009765625, -0.0194549560546875, -0.015346527099609375, -0.01123809814453125, -0.007129669189453125, -0.003021240234375, 0.001087188720703125, 0.00519561767578125, 0.009304046630859375, 0.0134124755859375, 0.017520904541015625, 0.02162933349609375, 0.025737762451171875, 0.02984619140625, 0.033954620361328125, 0.03806304931640625, 0.042171478271484375, 0.0462799072265625, 0.050388336181640625, 0.05449676513671875, 0.058605194091796875, 0.062713623046875, 0.06682205200195312, 0.07093048095703125, 0.07503890991210938, 0.0791473388671875, 0.08325576782226562, 0.08736419677734375, 0.09147262573242188, 0.0955810546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 24.0, 341.0, 604.0, 26.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9000369310379028, -0.8366281986236572, -0.7732194662094116, -0.7098106741905212, -0.6464019417762756, -0.58299320936203, -0.5195844173431396, -0.45617568492889404, -0.39276695251464844, -0.32935822010040283, -0.26594945788383484, -0.20254071056842804, -0.13913196325302124, -0.07572323083877563, -0.012314468622207642, 0.05109429359436035, 0.11450302600860596, 0.17791177332401276, 0.24132052063941956, 0.30472928285598755, 0.36813801527023315, 0.43154674768447876, 0.49495550990104675, 0.5583642721176147, 0.6217730045318604, 0.685181736946106, 0.7485904693603516, 0.8119992613792419, 0.8754079937934875, 0.9388167262077332, 1.0022255182266235, 1.0656342506408691, 1.1290431022644043, 1.19245183467865, 1.2558605670928955, 1.3192692995071411, 1.3826780319213867, 1.4460868835449219, 1.5094956159591675, 1.572904348373413, 1.6363130807876587, 1.6997218132019043, 1.76313054561615, 1.8265392780303955, 1.8899481296539307, 1.9533567428588867, 2.016765594482422, 2.080174446105957, 2.143583059310913, 2.2069919109344482, 2.2704005241394043, 2.3338093757629395, 2.3972179889678955, 2.4606268405914307, 2.5240354537963867, 2.587444305419922, 2.650853157043457, 2.714262008666992, 2.7776706218719482, 2.8410794734954834, 2.9044880867004395, 2.9678969383239746, 3.0313055515289307, 3.094714403152466, 3.158123016357422]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 10.0, 13.0, 22.0, 22.0, 25.0, 43.0, 36.0, 56.0, 70.0, 90.0, 70.0, 83.0, 78.0, 75.0, 62.0, 57.0, 44.0, 30.0, 29.0, 15.0, 12.0, 10.0, 10.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349156975746155, -0.3195090889930725, -0.30410248041152954, -0.2886958718299866, -0.2732892632484436, -0.25788265466690063, -0.24247604608535767, -0.2270694375038147, -0.21166282892227173, -0.19625622034072876, -0.1808496117591858, -0.16544300317764282, -0.15003639459609985, -0.13462978601455688, -0.11922316998243332, -0.10381656140089035, -0.08840994536876678, -0.07300333678722382, -0.05759672820568085, -0.04219011589884758, -0.02678350731730461, -0.011376895010471344, 0.004029713571071625, 0.019436322152614594, 0.03484293073415756, 0.05024953931570053, 0.0656561478972435, 0.08106276392936707, 0.09646937251091003, 0.111875981092453, 0.12728258967399597, 0.14268919825553894, 0.1580958068370819, 0.17350241541862488, 0.18890902400016785, 0.20431563258171082, 0.21972224116325378, 0.23512884974479675, 0.2505354583263397, 0.2659420669078827, 0.28134867548942566, 0.29675528407096863, 0.3121618926525116, 0.32756850123405457, 0.34297510981559753, 0.3583817183971405, 0.37378832697868347, 0.38919493556022644, 0.4046015739440918, 0.42000818252563477, 0.43541479110717773, 0.4508213996887207, 0.46622800827026367, 0.48163461685180664, 0.4970412254333496, 0.5124478340148926, 0.5278544425964355, 0.5432610511779785, 0.5586676597595215, 0.5740742683410645, 0.5894808769226074, 0.6048874855041504, 0.6202940940856934, 0.6357007026672363, 0.6511073112487793]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 13.0, 14.0, 28.0, 31.0, 37.0, 47.0, 71.0, 83.0, 107.0, 135.0, 221.0, 237.0, 369.0, 428.0, 620.0, 795.0, 1071.0, 1373.0, 1957.0, 2729.0, 3981.0, 5776.0, 9028.0, 14686.0, 25925.0, 88531.0, 806472.0, 33025.0, 17521.0, 10430.0, 6715.0, 4458.0, 3181.0, 2224.0, 1598.0, 1173.0, 891.0, 626.0, 475.0, 326.0, 251.0, 226.0, 132.0, 142.0, 78.0, 73.0, 64.0, 41.0, 32.0, 35.0, 21.0, 17.0, 14.0, 6.0, 7.0, 5.0, 1.0, 3.0], "bins": [-0.422119140625, -0.40899658203125, -0.3958740234375, -0.38275146484375, -0.36962890625, -0.35650634765625, -0.3433837890625, -0.33026123046875, -0.317138671875, -0.30401611328125, -0.2908935546875, -0.27777099609375, -0.2646484375, -0.25152587890625, -0.2384033203125, -0.22528076171875, -0.212158203125, -0.19903564453125, -0.1859130859375, -0.17279052734375, -0.15966796875, -0.14654541015625, -0.1334228515625, -0.12030029296875, -0.107177734375, -0.09405517578125, -0.0809326171875, -0.06781005859375, -0.0546875, -0.04156494140625, -0.0284423828125, -0.01531982421875, -0.002197265625, 0.01092529296875, 0.0240478515625, 0.03717041015625, 0.05029296875, 0.06341552734375, 0.0765380859375, 0.08966064453125, 0.102783203125, 0.11590576171875, 0.1290283203125, 0.14215087890625, 0.1552734375, 0.16839599609375, 0.1815185546875, 0.19464111328125, 0.207763671875, 0.22088623046875, 0.2340087890625, 0.24713134765625, 0.26025390625, 0.27337646484375, 0.2864990234375, 0.29962158203125, 0.312744140625, 0.32586669921875, 0.3389892578125, 0.35211181640625, 0.365234375, 0.37835693359375, 0.3914794921875, 0.40460205078125, 0.417724609375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 13.0, 6.0, 10.0, 10.0, 11.0, 8.0, 52.0, 696.0, 44.0, 14.0, 20.0, 6.0, 5.0, 5.0, 6.0, 7.0, 11.0, 3.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12353515625, -0.1197500228881836, -0.11596488952636719, -0.11217975616455078, -0.10839462280273438, -0.10460948944091797, -0.10082435607910156, -0.09703922271728516, -0.09325408935546875, -0.08946895599365234, -0.08568382263183594, -0.08189868927001953, -0.07811355590820312, -0.07432842254638672, -0.07054328918457031, -0.0667581558227539, -0.0629730224609375, -0.059187889099121094, -0.05540275573730469, -0.05161762237548828, -0.047832489013671875, -0.04404735565185547, -0.04026222229003906, -0.036477088928222656, -0.03269195556640625, -0.028906822204589844, -0.025121688842773438, -0.02133655548095703, -0.017551422119140625, -0.013766288757324219, -0.009981155395507812, -0.006196022033691406, -0.002410888671875, 0.0013742446899414062, 0.0051593780517578125, 0.008944511413574219, 0.012729644775390625, 0.01651477813720703, 0.020299911499023438, 0.024085044860839844, 0.02787017822265625, 0.031655311584472656, 0.03544044494628906, 0.03922557830810547, 0.043010711669921875, 0.04679584503173828, 0.05058097839355469, 0.054366111755371094, 0.0581512451171875, 0.061936378479003906, 0.06572151184082031, 0.06950664520263672, 0.07329177856445312, 0.07707691192626953, 0.08086204528808594, 0.08464717864990234, 0.08843231201171875, 0.09221744537353516, 0.09600257873535156, 0.09978771209716797, 0.10357284545898438, 0.10735797882080078, 0.11114311218261719, 0.1149282455444336, 0.11871337890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 9.0, 11.0, 16.0, 21.0, 24.0, 41.0, 51.0, 71.0, 113.0, 136.0, 206.0, 288.0, 511.0, 922.0, 1795.0, 4271.0, 11152.0, 33080.0, 115840.0, 438113.0, 322489.0, 79765.0, 24062.0, 8390.0, 3319.0, 1604.0, 792.0, 460.0, 293.0, 213.0, 151.0, 107.0, 73.0, 52.0, 25.0, 28.0, 14.0, 12.0, 6.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.306640625, -0.2960166931152344, -0.28539276123046875, -0.2747688293457031, -0.2641448974609375, -0.2535209655761719, -0.24289703369140625, -0.23227310180664062, -0.221649169921875, -0.21102523803710938, -0.20040130615234375, -0.18977737426757812, -0.1791534423828125, -0.16852951049804688, -0.15790557861328125, -0.14728164672851562, -0.13665771484375, -0.12603378295898438, -0.11540985107421875, -0.10478591918945312, -0.0941619873046875, -0.08353805541992188, -0.07291412353515625, -0.062290191650390625, -0.051666259765625, -0.041042327880859375, -0.03041839599609375, -0.019794464111328125, -0.0091705322265625, 0.001453399658203125, 0.01207733154296875, 0.022701263427734375, 0.0333251953125, 0.043949127197265625, 0.05457305908203125, 0.06519699096679688, 0.0758209228515625, 0.08644485473632812, 0.09706878662109375, 0.10769271850585938, 0.118316650390625, 0.12894058227539062, 0.13956451416015625, 0.15018844604492188, 0.1608123779296875, 0.17143630981445312, 0.18206024169921875, 0.19268417358398438, 0.20330810546875, 0.21393203735351562, 0.22455596923828125, 0.23517990112304688, 0.2458038330078125, 0.2564277648925781, 0.26705169677734375, 0.2776756286621094, 0.288299560546875, 0.2989234924316406, 0.30954742431640625, 0.3201713562011719, 0.3307952880859375, 0.3414192199707031, 0.35204315185546875, 0.3626670837402344, 0.373291015625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 3.0, 10.0, 9.0, 6.0, 22.0, 13.0, 16.0, 23.0, 33.0, 28.0, 26.0, 48.0, 34.0, 34.0, 42.0, 43.0, 50.0, 59.0, 43.0, 37.0, 53.0, 55.0, 33.0, 35.0, 30.0, 14.0, 31.0, 26.0, 21.0, 22.0, 26.0, 9.0, 16.0, 17.0, 7.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.509063720703125, -0.49273681640625, -0.476409912109375, -0.4600830078125, -0.443756103515625, -0.42742919921875, -0.411102294921875, -0.394775390625, -0.378448486328125, -0.36212158203125, -0.345794677734375, -0.3294677734375, -0.313140869140625, -0.29681396484375, -0.280487060546875, -0.26416015625, -0.247833251953125, -0.23150634765625, -0.215179443359375, -0.1988525390625, -0.182525634765625, -0.16619873046875, -0.149871826171875, -0.133544921875, -0.117218017578125, -0.10089111328125, -0.084564208984375, -0.0682373046875, -0.051910400390625, -0.03558349609375, -0.019256591796875, -0.0029296875, 0.013397216796875, 0.02972412109375, 0.046051025390625, 0.0623779296875, 0.078704833984375, 0.09503173828125, 0.111358642578125, 0.127685546875, 0.144012451171875, 0.16033935546875, 0.176666259765625, 0.1929931640625, 0.209320068359375, 0.22564697265625, 0.241973876953125, 0.25830078125, 0.274627685546875, 0.29095458984375, 0.307281494140625, 0.3236083984375, 0.339935302734375, 0.35626220703125, 0.372589111328125, 0.388916015625, 0.405242919921875, 0.42156982421875, 0.437896728515625, 0.4542236328125, 0.470550537109375, 0.48687744140625, 0.503204345703125, 0.51953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 6.0, 8.0, 9.0, 10.0, 13.0, 20.0, 23.0, 40.0, 44.0, 92.0, 134.0, 237.0, 417.0, 969.0, 2410.0, 7379.0, 41362.0, 886662.0, 92219.0, 10769.0, 3291.0, 1244.0, 532.0, 246.0, 151.0, 71.0, 43.0, 38.0, 39.0, 25.0, 14.0, 11.0, 6.0, 10.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7265472412109375, -0.703582763671875, -0.6806182861328125, -0.65765380859375, -0.6346893310546875, -0.611724853515625, -0.5887603759765625, -0.5657958984375, -0.5428314208984375, -0.519866943359375, -0.4969024658203125, -0.47393798828125, -0.4509735107421875, -0.428009033203125, -0.4050445556640625, -0.382080078125, -0.3591156005859375, -0.336151123046875, -0.3131866455078125, -0.29022216796875, -0.2672576904296875, -0.244293212890625, -0.2213287353515625, -0.1983642578125, -0.1753997802734375, -0.152435302734375, -0.1294708251953125, -0.10650634765625, -0.0835418701171875, -0.060577392578125, -0.0376129150390625, -0.0146484375, 0.0083160400390625, 0.031280517578125, 0.0542449951171875, 0.07720947265625, 0.1001739501953125, 0.123138427734375, 0.1461029052734375, 0.1690673828125, 0.1920318603515625, 0.214996337890625, 0.2379608154296875, 0.26092529296875, 0.2838897705078125, 0.306854248046875, 0.3298187255859375, 0.352783203125, 0.3757476806640625, 0.398712158203125, 0.4216766357421875, 0.44464111328125, 0.4676055908203125, 0.490570068359375, 0.5135345458984375, 0.5364990234375, 0.5594635009765625, 0.582427978515625, 0.6053924560546875, 0.62835693359375, 0.6513214111328125, 0.674285888671875, 0.6972503662109375, 0.72021484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 13.0, 15.0, 14.0, 14.0, 29.0, 29.0, 53.0, 70.0, 97.0, 112.0, 102.0, 101.0, 87.0, 63.0, 44.0, 34.0, 31.0, 30.0, 13.0, 18.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.6684017181396484e-05, -5.446188151836395e-05, -5.223974585533142e-05, -5.001761019229889e-05, -4.779547452926636e-05, -4.5573338866233826e-05, -4.3351203203201294e-05, -4.112906754016876e-05, -3.890693187713623e-05, -3.66847962141037e-05, -3.446266055107117e-05, -3.2240524888038635e-05, -3.0018389225006104e-05, -2.7796253561973572e-05, -2.557411789894104e-05, -2.3351982235908508e-05, -2.1129846572875977e-05, -1.8907710909843445e-05, -1.6685575246810913e-05, -1.4463439583778381e-05, -1.224130392074585e-05, -1.0019168257713318e-05, -7.797032594680786e-06, -5.574896931648254e-06, -3.3527612686157227e-06, -1.130625605583191e-06, 1.0915100574493408e-06, 3.3136457204818726e-06, 5.535781383514404e-06, 7.757917046546936e-06, 9.980052709579468e-06, 1.2202188372612e-05, 1.4424324035644531e-05, 1.6646459698677063e-05, 1.8868595361709595e-05, 2.1090731024742126e-05, 2.3312866687774658e-05, 2.553500235080719e-05, 2.775713801383972e-05, 2.9979273676872253e-05, 3.2201409339904785e-05, 3.442354500293732e-05, 3.664568066596985e-05, 3.886781632900238e-05, 4.108995199203491e-05, 4.3312087655067444e-05, 4.5534223318099976e-05, 4.775635898113251e-05, 4.997849464416504e-05, 5.220063030719757e-05, 5.44227659702301e-05, 5.6644901633262634e-05, 5.8867037296295166e-05, 6.10891729593277e-05, 6.331130862236023e-05, 6.553344428539276e-05, 6.775557994842529e-05, 6.997771561145782e-05, 7.219985127449036e-05, 7.442198693752289e-05, 7.664412260055542e-05, 7.886625826358795e-05, 8.108839392662048e-05, 8.331052958965302e-05, 8.553266525268555e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 16.0, 20.0, 27.0, 45.0, 90.0, 122.0, 231.0, 445.0, 994.0, 3176.0, 12186.0, 87637.0, 812940.0, 110735.0, 13925.0, 3479.0, 1266.0, 551.0, 250.0, 143.0, 76.0, 54.0, 31.0, 25.0, 16.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.46096038818359375, -0.4453582763671875, -0.42975616455078125, -0.414154052734375, -0.39855194091796875, -0.3829498291015625, -0.36734771728515625, -0.35174560546875, -0.33614349365234375, -0.3205413818359375, -0.30493927001953125, -0.289337158203125, -0.27373504638671875, -0.2581329345703125, -0.24253082275390625, -0.2269287109375, -0.21132659912109375, -0.1957244873046875, -0.18012237548828125, -0.164520263671875, -0.14891815185546875, -0.1333160400390625, -0.11771392822265625, -0.10211181640625, -0.08650970458984375, -0.0709075927734375, -0.05530548095703125, -0.039703369140625, -0.02410125732421875, -0.0084991455078125, 0.00710296630859375, 0.022705078125, 0.03830718994140625, 0.0539093017578125, 0.06951141357421875, 0.085113525390625, 0.10071563720703125, 0.1163177490234375, 0.13191986083984375, 0.14752197265625, 0.16312408447265625, 0.1787261962890625, 0.19432830810546875, 0.209930419921875, 0.22553253173828125, 0.2411346435546875, 0.25673675537109375, 0.2723388671875, 0.28794097900390625, 0.3035430908203125, 0.31914520263671875, 0.334747314453125, 0.35034942626953125, 0.3659515380859375, 0.38155364990234375, 0.39715576171875, 0.41275787353515625, 0.4283599853515625, 0.44396209716796875, 0.459564208984375, 0.47516632080078125, 0.4907684326171875, 0.5063705444335938, 0.52197265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 9.0, 15.0, 21.0, 34.0, 47.0, 73.0, 76.0, 118.0, 136.0, 118.0, 102.0, 76.0, 54.0, 27.0, 19.0, 14.0, 12.0, 6.0, 6.0, 10.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6131668090820312, -0.5925445556640625, -0.5719223022460938, -0.551300048828125, -0.5306777954101562, -0.5100555419921875, -0.48943328857421875, -0.46881103515625, -0.44818878173828125, -0.4275665283203125, -0.40694427490234375, -0.386322021484375, -0.36569976806640625, -0.3450775146484375, -0.32445526123046875, -0.3038330078125, -0.28321075439453125, -0.2625885009765625, -0.24196624755859375, -0.221343994140625, -0.20072174072265625, -0.1800994873046875, -0.15947723388671875, -0.13885498046875, -0.11823272705078125, -0.0976104736328125, -0.07698822021484375, -0.056365966796875, -0.03574371337890625, -0.0151214599609375, 0.00550079345703125, 0.026123046875, 0.04674530029296875, 0.0673675537109375, 0.08798980712890625, 0.108612060546875, 0.12923431396484375, 0.1498565673828125, 0.17047882080078125, 0.19110107421875, 0.21172332763671875, 0.2323455810546875, 0.25296783447265625, 0.273590087890625, 0.29421234130859375, 0.3148345947265625, 0.33545684814453125, 0.3560791015625, 0.37670135498046875, 0.3973236083984375, 0.41794586181640625, 0.438568115234375, 0.45919036865234375, 0.4798126220703125, 0.5004348754882812, 0.52105712890625, 0.5416793823242188, 0.5623016357421875, 0.5829238891601562, 0.603546142578125, 0.6241683959960938, 0.6447906494140625, 0.6654129028320312, 0.68603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 3.0, 12.0, 7.0, 27.0, 114.0, 391.0, 315.0, 69.0, 30.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.18556022644043, -11.925686836242676, -11.665812492370605, -11.405939102172852, -11.146064758300781, -10.886191368103027, -10.626317977905273, -10.366443634033203, -10.10657024383545, -9.846696853637695, -9.586822509765625, -9.326949119567871, -9.0670747756958, -8.807201385498047, -8.547327041625977, -8.287453651428223, -8.027580261230469, -7.767706394195557, -7.5078325271606445, -7.247959136962891, -6.9880852699279785, -6.728211402893066, -6.468337535858154, -6.208463668823242, -5.948589324951172, -5.68871545791626, -5.428841590881348, -5.168968200683594, -4.909094333648682, -4.6492204666137695, -4.389346599578857, -4.129472732543945, -3.8695998191833496, -3.6097259521484375, -3.3498523235321045, -3.0899784564971924, -2.8301048278808594, -2.5702309608459473, -2.310357093811035, -2.050483226776123, -1.79060959815979, -1.5307358503341675, -1.270862102508545, -1.0109882354736328, -0.7511144876480103, -0.4912407398223877, -0.23136687278747559, 0.028506875038146973, 0.28838062286376953, 0.5482543706893921, 0.8081281781196594, 1.0680019855499268, 1.3278757333755493, 1.5877494812011719, 1.847623348236084, 2.107497215270996, 2.367370843887329, 2.627244710922241, 2.887118339538574, 3.1469922065734863, 3.4068660736083984, 3.6667397022247314, 3.9266135692596436, 4.186487197875977, 4.446361064910889]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 8.0, 15.0, 19.0, 12.0, 36.0, 63.0, 100.0, 106.0, 159.0, 138.0, 115.0, 68.0, 37.0, 21.0, 15.0, 9.0, 6.0, 4.0, 5.0, 3.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.108667373657227, -8.811705589294434, -8.514742851257324, -8.217781066894531, -7.92081880569458, -7.623856544494629, -7.326894760131836, -7.029932498931885, -6.732970237731934, -6.436007976531982, -6.1390461921691895, -5.842083930969238, -5.545121669769287, -5.248159408569336, -4.951197624206543, -4.654235363006592, -4.357273578643799, -4.060311317443848, -3.7633492946624756, -3.4663872718811035, -3.1694250106811523, -2.8724629878997803, -2.575500965118408, -2.278538703918457, -1.981576681137085, -1.6846145391464233, -1.3876523971557617, -1.0906903743743896, -0.793728232383728, -0.4967660903930664, -0.19980406761169434, 0.09715819358825684, 0.3941202163696289, 0.6910823583602905, 0.9880444407463074, 1.2850065231323242, 1.5819686651229858, 1.8789308071136475, 2.1758928298950195, 2.4728550910949707, 2.7698171138763428, 3.066779136657715, 3.363741397857666, 3.660703420639038, 3.95766544342041, 4.254627704620361, 4.5515899658203125, 4.8485517501831055, 5.145514011383057, 5.442476272583008, 5.739438056945801, 6.036400318145752, 6.333362579345703, 6.630324363708496, 6.927286624908447, 7.224248886108398, 7.521210670471191, 7.818172931671143, 8.115135192871094, 8.412096977233887, 8.70905876159668, 9.006021499633789, 9.302983283996582, 9.599945068359375, 9.896907806396484]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 11.0, 10.0, 12.0, 13.0, 24.0, 23.0, 34.0, 46.0, 72.0, 80.0, 101.0, 155.0, 224.0, 328.0, 448.0, 692.0, 1100.0, 1722.0, 3172.0, 5849.0, 14264.0, 52684.0, 3512929.0, 524048.0, 44905.0, 14708.0, 6866.0, 3562.0, 2232.0, 1361.0, 875.0, 555.0, 368.0, 251.0, 162.0, 140.0, 69.0, 58.0, 35.0, 33.0, 10.0, 12.0, 14.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0], "bins": [-1.1318359375, -1.1019744873046875, -1.072113037109375, -1.0422515869140625, -1.01239013671875, -0.9825286865234375, -0.952667236328125, -0.9228057861328125, -0.8929443359375, -0.8630828857421875, -0.833221435546875, -0.8033599853515625, -0.77349853515625, -0.7436370849609375, -0.713775634765625, -0.6839141845703125, -0.654052734375, -0.6241912841796875, -0.594329833984375, -0.5644683837890625, -0.53460693359375, -0.5047454833984375, -0.474884033203125, -0.4450225830078125, -0.4151611328125, -0.3852996826171875, -0.355438232421875, -0.3255767822265625, -0.29571533203125, -0.2658538818359375, -0.235992431640625, -0.2061309814453125, -0.17626953125, -0.1464080810546875, -0.116546630859375, -0.0866851806640625, -0.05682373046875, -0.0269622802734375, 0.002899169921875, 0.0327606201171875, 0.0626220703125, 0.0924835205078125, 0.122344970703125, 0.1522064208984375, 0.18206787109375, 0.2119293212890625, 0.241790771484375, 0.2716522216796875, 0.301513671875, 0.3313751220703125, 0.361236572265625, 0.3910980224609375, 0.42095947265625, 0.4508209228515625, 0.480682373046875, 0.5105438232421875, 0.5404052734375, 0.5702667236328125, 0.600128173828125, 0.6299896240234375, 0.65985107421875, 0.6897125244140625, 0.719573974609375, 0.7494354248046875, 0.779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 6.0, 12.0, 12.0, 19.0, 22.0, 54.0, 192.0, 355.0, 164.0, 36.0, 21.0, 7.0, 7.0, 10.0, 10.0, 8.0, 2.0, 3.0, 8.0, 6.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1473388671875, -0.14342117309570312, -0.13950347900390625, -0.13558578491210938, -0.1316680908203125, -0.12775039672851562, -0.12383270263671875, -0.11991500854492188, -0.115997314453125, -0.11207962036132812, -0.10816192626953125, -0.10424423217773438, -0.1003265380859375, -0.09640884399414062, -0.09249114990234375, -0.08857345581054688, -0.08465576171875, -0.08073806762695312, -0.07682037353515625, -0.07290267944335938, -0.0689849853515625, -0.06506729125976562, -0.06114959716796875, -0.057231903076171875, -0.053314208984375, -0.049396514892578125, -0.04547882080078125, -0.041561126708984375, -0.0376434326171875, -0.033725738525390625, -0.02980804443359375, -0.025890350341796875, -0.02197265625, -0.018054962158203125, -0.01413726806640625, -0.010219573974609375, -0.0063018798828125, -0.002384185791015625, 0.00153350830078125, 0.005451202392578125, 0.009368896484375, 0.013286590576171875, 0.01720428466796875, 0.021121978759765625, 0.0250396728515625, 0.028957366943359375, 0.03287506103515625, 0.036792755126953125, 0.04071044921875, 0.044628143310546875, 0.04854583740234375, 0.052463531494140625, 0.0563812255859375, 0.060298919677734375, 0.06421661376953125, 0.06813430786132812, 0.072052001953125, 0.07596969604492188, 0.07988739013671875, 0.08380508422851562, 0.0877227783203125, 0.09164047241210938, 0.09555816650390625, 0.09947586059570312, 0.1033935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 1.0, 10.0, 12.0, 11.0, 19.0, 20.0, 33.0, 56.0, 69.0, 122.0, 186.0, 333.0, 571.0, 1024.0, 2258.0, 5739.0, 18919.0, 108892.0, 3365410.0, 625314.0, 46345.0, 11059.0, 3871.0, 1784.0, 845.0, 503.0, 313.0, 211.0, 99.0, 59.0, 46.0, 46.0, 21.0, 21.0, 11.0, 10.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.44775390625, -0.4296875, -0.41162109375, -0.3935546875, -0.37548828125, -0.357421875, -0.33935546875, -0.3212890625, -0.30322265625, -0.28515625, -0.26708984375, -0.2490234375, -0.23095703125, -0.212890625, -0.19482421875, -0.1767578125, -0.15869140625, -0.140625, -0.12255859375, -0.1044921875, -0.08642578125, -0.068359375, -0.05029296875, -0.0322265625, -0.01416015625, 0.00390625, 0.02197265625, 0.0400390625, 0.05810546875, 0.076171875, 0.09423828125, 0.1123046875, 0.13037109375, 0.1484375, 0.16650390625, 0.1845703125, 0.20263671875, 0.220703125, 0.23876953125, 0.2568359375, 0.27490234375, 0.29296875, 0.31103515625, 0.3291015625, 0.34716796875, 0.365234375, 0.38330078125, 0.4013671875, 0.41943359375, 0.4375, 0.45556640625, 0.4736328125, 0.49169921875, 0.509765625, 0.52783203125, 0.5458984375, 0.56396484375, 0.58203125, 0.60009765625, 0.6181640625, 0.63623046875, 0.654296875, 0.67236328125, 0.6904296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 12.0, 19.0, 27.0, 26.0, 48.0, 107.0, 234.0, 527.0, 1598.0, 780.0, 282.0, 137.0, 82.0, 45.0, 30.0, 17.0, 20.0, 11.0, 11.0, 9.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.146240234375, -0.1413249969482422, -0.13640975952148438, -0.13149452209472656, -0.12657928466796875, -0.12166404724121094, -0.11674880981445312, -0.11183357238769531, -0.1069183349609375, -0.10200309753417969, -0.09708786010742188, -0.09217262268066406, -0.08725738525390625, -0.08234214782714844, -0.07742691040039062, -0.07251167297363281, -0.067596435546875, -0.06268119812011719, -0.057765960693359375, -0.05285072326660156, -0.04793548583984375, -0.04302024841308594, -0.038105010986328125, -0.03318977355957031, -0.0282745361328125, -0.023359298706054688, -0.018444061279296875, -0.013528823852539062, -0.00861358642578125, -0.0036983489990234375, 0.001216888427734375, 0.0061321258544921875, 0.01104736328125, 0.015962600708007812, 0.020877838134765625, 0.025793075561523438, 0.03070831298828125, 0.03562355041503906, 0.040538787841796875, 0.04545402526855469, 0.0503692626953125, 0.05528450012207031, 0.060199737548828125, 0.06511497497558594, 0.07003021240234375, 0.07494544982910156, 0.07986068725585938, 0.08477592468261719, 0.089691162109375, 0.09460639953613281, 0.09952163696289062, 0.10443687438964844, 0.10935211181640625, 0.11426734924316406, 0.11918258666992188, 0.12409782409667969, 0.1290130615234375, 0.1339282989501953, 0.13884353637695312, 0.14375877380371094, 0.14867401123046875, 0.15358924865722656, 0.15850448608398438, 0.1634197235107422, 0.1683349609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 17.0, 81.0, 394.0, 403.0, 65.0, 20.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.229240894317627, -1.1784467697143555, -1.127652645111084, -1.0768585205078125, -1.0260645151138306, -0.9752703905105591, -0.9244762659072876, -0.8736821413040161, -0.8228880763053894, -0.7720939517021179, -0.7212998867034912, -0.6705057621002197, -0.6197116374969482, -0.5689175724983215, -0.51812344789505, -0.46732935309410095, -0.41653525829315186, -0.36574116349220276, -0.31494706869125366, -0.2641529440879822, -0.21335884928703308, -0.16256475448608398, -0.1117706298828125, -0.0609765350818634, -0.010182440280914307, 0.04061166197061539, 0.09140576422214508, 0.14219987392425537, 0.19299396872520447, 0.24378806352615356, 0.29458218812942505, 0.34537628293037415, 0.39617037773132324, 0.44696447253227234, 0.49775856733322144, 0.5485526919364929, 0.5993467569351196, 0.6501408815383911, 0.7009350061416626, 0.7517291307449341, 0.8025231957435608, 0.8533173203468323, 0.904111385345459, 0.9549055099487305, 1.005699634552002, 1.0564937591552734, 1.107287883758545, 1.1580818891525269, 1.2088760137557983, 1.2596701383590698, 1.3104642629623413, 1.3612582683563232, 1.4120523929595947, 1.4628465175628662, 1.5136406421661377, 1.5644347667694092, 1.6152288913726807, 1.6660230159759521, 1.7168171405792236, 1.7676112651824951, 1.818405270576477, 1.8691993951797485, 1.91999351978302, 1.9707876443862915, 2.0215816497802734]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 9.0, 16.0, 6.0, 20.0, 32.0, 50.0, 49.0, 55.0, 88.0, 91.0, 102.0, 92.0, 92.0, 73.0, 54.0, 58.0, 20.0, 20.0, 22.0, 14.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8361510038375854, -0.8090371489524841, -0.7819233536720276, -0.7548094987869263, -0.727695643901825, -0.7005817890167236, -0.6734679937362671, -0.6463541388511658, -0.6192402839660645, -0.5921264290809631, -0.5650126338005066, -0.5378987789154053, -0.510784924030304, -0.483671098947525, -0.4565572738647461, -0.4294434189796448, -0.40232962369918823, -0.3752157986164093, -0.348101943731308, -0.32098811864852905, -0.29387426376342773, -0.2667604386806488, -0.23964661359786987, -0.21253277361392975, -0.18541893362998962, -0.1583050936460495, -0.13119125366210938, -0.10407742857933044, -0.07696358859539032, -0.049849748611450195, -0.022735923528671265, 0.00437791645526886, 0.03149169683456421, 0.058605533093214035, 0.08571936935186386, 0.11283320188522339, 0.1399470418691635, 0.16706088185310364, 0.19417470693588257, 0.2212885469198227, 0.24840238690376282, 0.27551621198654175, 0.30263006687164307, 0.329743891954422, 0.3568577170372009, 0.38397157192230225, 0.4110853970050812, 0.4381992220878601, 0.4653130769729614, 0.49242690205574036, 0.5195407271385193, 0.5466545820236206, 0.5737684369087219, 0.6008822917938232, 0.6279960870742798, 0.6551099419593811, 0.6822237968444824, 0.7093376517295837, 0.7364514470100403, 0.7635653018951416, 0.7906791567802429, 0.8177930116653442, 0.8449068069458008, 0.8720206618309021, 0.8991344571113586]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 12.0, 10.0, 17.0, 15.0, 32.0, 50.0, 86.0, 102.0, 136.0, 255.0, 383.0, 620.0, 1151.0, 2107.0, 4033.0, 8214.0, 18547.0, 56435.0, 761295.0, 146336.0, 26272.0, 10862.0, 5305.0, 2658.0, 1424.0, 824.0, 459.0, 323.0, 183.0, 120.0, 86.0, 63.0, 37.0, 29.0, 18.0, 14.0, 13.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7265625, -0.7050018310546875, -0.683441162109375, -0.6618804931640625, -0.64031982421875, -0.6187591552734375, -0.597198486328125, -0.5756378173828125, -0.5540771484375, -0.5325164794921875, -0.510955810546875, -0.4893951416015625, -0.46783447265625, -0.4462738037109375, -0.424713134765625, -0.4031524658203125, -0.381591796875, -0.3600311279296875, -0.338470458984375, -0.3169097900390625, -0.29534912109375, -0.2737884521484375, -0.252227783203125, -0.2306671142578125, -0.2091064453125, -0.1875457763671875, -0.165985107421875, -0.1444244384765625, -0.12286376953125, -0.1013031005859375, -0.079742431640625, -0.0581817626953125, -0.03662109375, -0.0150604248046875, 0.006500244140625, 0.0280609130859375, 0.04962158203125, 0.0711822509765625, 0.092742919921875, 0.1143035888671875, 0.1358642578125, 0.1574249267578125, 0.178985595703125, 0.2005462646484375, 0.22210693359375, 0.2436676025390625, 0.265228271484375, 0.2867889404296875, 0.308349609375, 0.3299102783203125, 0.351470947265625, 0.3730316162109375, 0.39459228515625, 0.4161529541015625, 0.437713623046875, 0.4592742919921875, 0.4808349609375, 0.5023956298828125, 0.523956298828125, 0.5455169677734375, 0.56707763671875, 0.5886383056640625, 0.610198974609375, 0.6317596435546875, 0.6533203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 5.0, 18.0, 18.0, 19.0, 35.0, 100.0, 223.0, 279.0, 134.0, 51.0, 14.0, 18.0, 10.0, 5.0, 10.0, 7.0, 9.0, 4.0, 5.0, 3.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.1454010009765625, -0.141510009765625, -0.1376190185546875, -0.13372802734375, -0.1298370361328125, -0.125946044921875, -0.1220550537109375, -0.1181640625, -0.1142730712890625, -0.110382080078125, -0.1064910888671875, -0.10260009765625, -0.0987091064453125, -0.094818115234375, -0.0909271240234375, -0.0870361328125, -0.0831451416015625, -0.079254150390625, -0.0753631591796875, -0.07147216796875, -0.0675811767578125, -0.063690185546875, -0.0597991943359375, -0.055908203125, -0.0520172119140625, -0.048126220703125, -0.0442352294921875, -0.04034423828125, -0.0364532470703125, -0.032562255859375, -0.0286712646484375, -0.0247802734375, -0.0208892822265625, -0.016998291015625, -0.0131072998046875, -0.00921630859375, -0.0053253173828125, -0.001434326171875, 0.0024566650390625, 0.00634765625, 0.0102386474609375, 0.014129638671875, 0.0180206298828125, 0.02191162109375, 0.0258026123046875, 0.029693603515625, 0.0335845947265625, 0.0374755859375, 0.0413665771484375, 0.045257568359375, 0.0491485595703125, 0.05303955078125, 0.0569305419921875, 0.060821533203125, 0.0647125244140625, 0.068603515625, 0.0724945068359375, 0.076385498046875, 0.0802764892578125, 0.08416748046875, 0.0880584716796875, 0.091949462890625, 0.0958404541015625, 0.0997314453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 17.0, 38.0, 62.0, 176.0, 467.0, 1540.0, 7630.0, 77468.0, 804403.0, 142914.0, 10891.0, 1990.0, 576.0, 183.0, 86.0, 48.0, 14.0, 12.0, 9.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.76025390625, -0.7361984252929688, -0.7121429443359375, -0.6880874633789062, -0.664031982421875, -0.6399765014648438, -0.6159210205078125, -0.5918655395507812, -0.56781005859375, -0.5437545776367188, -0.5196990966796875, -0.49564361572265625, -0.471588134765625, -0.44753265380859375, -0.4234771728515625, -0.39942169189453125, -0.3753662109375, -0.35131072998046875, -0.3272552490234375, -0.30319976806640625, -0.279144287109375, -0.25508880615234375, -0.2310333251953125, -0.20697784423828125, -0.18292236328125, -0.15886688232421875, -0.1348114013671875, -0.11075592041015625, -0.086700439453125, -0.06264495849609375, -0.0385894775390625, -0.01453399658203125, 0.009521484375, 0.03357696533203125, 0.0576324462890625, 0.08168792724609375, 0.105743408203125, 0.12979888916015625, 0.1538543701171875, 0.17790985107421875, 0.20196533203125, 0.22602081298828125, 0.2500762939453125, 0.27413177490234375, 0.298187255859375, 0.32224273681640625, 0.3462982177734375, 0.37035369873046875, 0.3944091796875, 0.41846466064453125, 0.4425201416015625, 0.46657562255859375, 0.490631103515625, 0.5146865844726562, 0.5387420654296875, 0.5627975463867188, 0.58685302734375, 0.6109085083007812, 0.6349639892578125, 0.6590194702148438, 0.683074951171875, 0.7071304321289062, 0.7311859130859375, 0.7552413940429688, 0.779296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 6.0, 9.0, 7.0, 7.0, 17.0, 17.0, 24.0, 32.0, 30.0, 29.0, 20.0, 34.0, 40.0, 34.0, 35.0, 37.0, 43.0, 39.0, 42.0, 53.0, 40.0, 48.0, 42.0, 37.0, 30.0, 34.0, 34.0, 28.0, 33.0, 23.0, 19.0, 9.0, 21.0, 7.0, 12.0, 8.0, 4.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.33090972900390625, -0.3207550048828125, -0.31060028076171875, -0.300445556640625, -0.29029083251953125, -0.2801361083984375, -0.26998138427734375, -0.25982666015625, -0.24967193603515625, -0.2395172119140625, -0.22936248779296875, -0.219207763671875, -0.20905303955078125, -0.1988983154296875, -0.18874359130859375, -0.1785888671875, -0.16843414306640625, -0.1582794189453125, -0.14812469482421875, -0.137969970703125, -0.12781524658203125, -0.1176605224609375, -0.10750579833984375, -0.09735107421875, -0.08719635009765625, -0.0770416259765625, -0.06688690185546875, -0.056732177734375, -0.04657745361328125, -0.0364227294921875, -0.02626800537109375, -0.01611328125, -0.00595855712890625, 0.0041961669921875, 0.01435089111328125, 0.024505615234375, 0.03466033935546875, 0.0448150634765625, 0.05496978759765625, 0.06512451171875, 0.07527923583984375, 0.0854339599609375, 0.09558868408203125, 0.105743408203125, 0.11589813232421875, 0.1260528564453125, 0.13620758056640625, 0.1463623046875, 0.15651702880859375, 0.1666717529296875, 0.17682647705078125, 0.186981201171875, 0.19713592529296875, 0.2072906494140625, 0.21744537353515625, 0.22760009765625, 0.23775482177734375, 0.2479095458984375, 0.25806427001953125, 0.268218994140625, 0.27837371826171875, 0.2885284423828125, 0.29868316650390625, 0.308837890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 8.0, 7.0, 16.0, 23.0, 39.0, 55.0, 78.0, 132.0, 220.0, 517.0, 1030.0, 2923.0, 13091.0, 270600.0, 733426.0, 20043.0, 3867.0, 1236.0, 554.0, 285.0, 157.0, 82.0, 53.0, 32.0, 18.0, 17.0, 8.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99169921875, -0.9564132690429688, -0.9211273193359375, -0.8858413696289062, -0.850555419921875, -0.8152694702148438, -0.7799835205078125, -0.7446975708007812, -0.70941162109375, -0.6741256713867188, -0.6388397216796875, -0.6035537719726562, -0.568267822265625, -0.5329818725585938, -0.4976959228515625, -0.46240997314453125, -0.4271240234375, -0.39183807373046875, -0.3565521240234375, -0.32126617431640625, -0.285980224609375, -0.25069427490234375, -0.2154083251953125, -0.18012237548828125, -0.14483642578125, -0.10955047607421875, -0.0742645263671875, -0.03897857666015625, -0.003692626953125, 0.03159332275390625, 0.0668792724609375, 0.10216522216796875, 0.137451171875, 0.17273712158203125, 0.2080230712890625, 0.24330902099609375, 0.278594970703125, 0.31388092041015625, 0.3491668701171875, 0.38445281982421875, 0.41973876953125, 0.45502471923828125, 0.4903106689453125, 0.5255966186523438, 0.560882568359375, 0.5961685180664062, 0.6314544677734375, 0.6667404174804688, 0.7020263671875, 0.7373123168945312, 0.7725982666015625, 0.8078842163085938, 0.843170166015625, 0.8784561157226562, 0.9137420654296875, 0.9490280151367188, 0.98431396484375, 1.0195999145507812, 1.0548858642578125, 1.0901718139648438, 1.125457763671875, 1.1607437133789062, 1.1960296630859375, 1.2313156127929688, 1.2666015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 4.0, 9.0, 13.0, 12.0, 19.0, 34.0, 64.0, 104.0, 139.0, 184.0, 159.0, 86.0, 53.0, 30.0, 31.0, 14.0, 13.0, 6.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019431114196777344, -0.0001881122589111328, -0.0001819133758544922, -0.00017571449279785156, -0.00016951560974121094, -0.0001633167266845703, -0.0001571178436279297, -0.00015091896057128906, -0.00014472007751464844, -0.0001385211944580078, -0.0001323223114013672, -0.00012612342834472656, -0.00011992454528808594, -0.00011372566223144531, -0.00010752677917480469, -0.00010132789611816406, -9.512901306152344e-05, -8.893013000488281e-05, -8.273124694824219e-05, -7.653236389160156e-05, -7.033348083496094e-05, -6.413459777832031e-05, -5.793571472167969e-05, -5.173683166503906e-05, -4.553794860839844e-05, -3.933906555175781e-05, -3.314018249511719e-05, -2.6941299438476562e-05, -2.0742416381835938e-05, -1.4543533325195312e-05, -8.344650268554688e-06, -2.1457672119140625e-06, 4.0531158447265625e-06, 1.0251998901367188e-05, 1.6450881958007812e-05, 2.2649765014648438e-05, 2.8848648071289062e-05, 3.504753112792969e-05, 4.124641418457031e-05, 4.744529724121094e-05, 5.364418029785156e-05, 5.984306335449219e-05, 6.604194641113281e-05, 7.224082946777344e-05, 7.843971252441406e-05, 8.463859558105469e-05, 9.083747863769531e-05, 9.703636169433594e-05, 0.00010323524475097656, 0.00010943412780761719, 0.00011563301086425781, 0.00012183189392089844, 0.00012803077697753906, 0.0001342296600341797, 0.0001404285430908203, 0.00014662742614746094, 0.00015282630920410156, 0.0001590251922607422, 0.0001652240753173828, 0.00017142295837402344, 0.00017762184143066406, 0.0001838207244873047, 0.0001900196075439453, 0.00019621849060058594, 0.00020241737365722656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 8.0, 3.0, 7.0, 14.0, 16.0, 28.0, 40.0, 50.0, 86.0, 165.0, 303.0, 617.0, 1578.0, 4605.0, 18589.0, 160209.0, 769605.0, 73949.0, 12342.0, 3543.0, 1334.0, 616.0, 335.0, 180.0, 99.0, 69.0, 48.0, 33.0, 24.0, 18.0, 6.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.48947906494140625, -0.4701690673828125, -0.45085906982421875, -0.431549072265625, -0.41223907470703125, -0.3929290771484375, -0.37361907958984375, -0.35430908203125, -0.33499908447265625, -0.3156890869140625, -0.29637908935546875, -0.277069091796875, -0.25775909423828125, -0.2384490966796875, -0.21913909912109375, -0.1998291015625, -0.18051910400390625, -0.1612091064453125, -0.14189910888671875, -0.122589111328125, -0.10327911376953125, -0.0839691162109375, -0.06465911865234375, -0.04534912109375, -0.02603912353515625, -0.0067291259765625, 0.01258087158203125, 0.031890869140625, 0.05120086669921875, 0.0705108642578125, 0.08982086181640625, 0.109130859375, 0.12844085693359375, 0.1477508544921875, 0.16706085205078125, 0.186370849609375, 0.20568084716796875, 0.2249908447265625, 0.24430084228515625, 0.26361083984375, 0.28292083740234375, 0.3022308349609375, 0.32154083251953125, 0.340850830078125, 0.36016082763671875, 0.3794708251953125, 0.39878082275390625, 0.4180908203125, 0.43740081787109375, 0.4567108154296875, 0.47602081298828125, 0.495330810546875, 0.5146408081054688, 0.5339508056640625, 0.5532608032226562, 0.57257080078125, 0.5918807983398438, 0.6111907958984375, 0.6305007934570312, 0.649810791015625, 0.6691207885742188, 0.6884307861328125, 0.7077407836914062, 0.72705078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 13.0, 10.0, 17.0, 29.0, 38.0, 33.0, 63.0, 91.0, 98.0, 103.0, 116.0, 88.0, 66.0, 47.0, 37.0, 29.0, 20.0, 14.0, 23.0, 8.0, 3.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.361083984375, -0.3465080261230469, -0.33193206787109375, -0.3173561096191406, -0.3027801513671875, -0.2882041931152344, -0.27362823486328125, -0.2590522766113281, -0.244476318359375, -0.22990036010742188, -0.21532440185546875, -0.20074844360351562, -0.1861724853515625, -0.17159652709960938, -0.15702056884765625, -0.14244461059570312, -0.12786865234375, -0.11329269409179688, -0.09871673583984375, -0.08414077758789062, -0.0695648193359375, -0.054988861083984375, -0.04041290283203125, -0.025836944580078125, -0.011260986328125, 0.003314971923828125, 0.01789093017578125, 0.032466888427734375, 0.0470428466796875, 0.061618804931640625, 0.07619476318359375, 0.09077072143554688, 0.1053466796875, 0.11992263793945312, 0.13449859619140625, 0.14907455444335938, 0.1636505126953125, 0.17822647094726562, 0.19280242919921875, 0.20737838745117188, 0.221954345703125, 0.23653030395507812, 0.25110626220703125, 0.2656822204589844, 0.2802581787109375, 0.2948341369628906, 0.30941009521484375, 0.3239860534667969, 0.33856201171875, 0.3531379699707031, 0.36771392822265625, 0.3822898864746094, 0.3968658447265625, 0.4114418029785156, 0.42601776123046875, 0.4405937194824219, 0.455169677734375, 0.4697456359863281, 0.48432159423828125, 0.4988975524902344, 0.5134735107421875, 0.5280494689941406, 0.5426254272460938, 0.5572013854980469, 0.57177734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 16.0, 88.0, 436.0, 381.0, 48.0, 13.0, 10.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.177377223968506, -6.9203948974609375, -6.663412094116211, -6.406429767608643, -6.149447441101074, -5.892464637756348, -5.635482311248779, -5.378499984741211, -5.121517181396484, -4.864534854888916, -4.6075520515441895, -4.350569725036621, -4.093587398529053, -3.8366048336029053, -3.579622268676758, -3.3226399421691895, -3.065657615661621, -2.8086750507354736, -2.5516927242279053, -2.294710159301758, -2.0377278327941895, -1.780745267868042, -1.5237627029418945, -1.2667802572250366, -1.0097978115081787, -0.7528153657913208, -0.4958328604698181, -0.23885035514831543, 0.01813209056854248, 0.2751145362854004, 0.5320971012115479, 0.7890795469284058, 1.0460624694824219, 1.3030449151992798, 1.5600273609161377, 1.8170099258422852, 2.0739922523498535, 2.330974817276001, 2.5879573822021484, 2.844939708709717, 3.1019222736358643, 3.3589048385620117, 3.61588716506958, 3.8728697299957275, 4.129852294921875, 4.386834621429443, 4.643816947937012, 4.900799751281738, 5.157782077789307, 5.414764404296875, 5.671747207641602, 5.92872953414917, 6.185711860656738, 6.442694664001465, 6.699676990509033, 6.956659317016602, 7.213642120361328, 7.4706244468688965, 7.727607250213623, 7.984589576721191, 8.241572380065918, 8.498554229736328, 8.755537033081055, 9.012519836425781, 9.269501686096191]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 7.0, 13.0, 24.0, 25.0, 52.0, 72.0, 76.0, 95.0, 111.0, 137.0, 93.0, 80.0, 58.0, 49.0, 24.0, 18.0, 11.0, 14.0, 3.0, 7.0, 5.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.342592239379883, -4.184720516204834, -4.026848793029785, -3.8689773082733154, -3.7111055850982666, -3.5532338619232178, -3.395362377166748, -3.237490653991699, -3.0796189308166504, -2.9217472076416016, -2.7638754844665527, -2.606003999710083, -2.448132276535034, -2.2902605533599854, -2.1323890686035156, -1.9745173454284668, -1.816645622253418, -1.6587738990783691, -1.5009022951126099, -1.3430306911468506, -1.1851589679718018, -1.027287244796753, -0.8694156408309937, -0.7115440368652344, -0.5536723136901855, -0.3958006501197815, -0.23792898654937744, -0.08005732297897339, 0.07781434059143066, 0.23568600416183472, 0.39355766773223877, 0.551429271697998, 0.7093014717102051, 0.8671731352806091, 1.0250447988510132, 1.1829164028167725, 1.3407881259918213, 1.4986598491668701, 1.6565314531326294, 1.8144030570983887, 1.9722747802734375, 2.1301465034484863, 2.288018226623535, 2.445889711380005, 2.6037614345550537, 2.7616331577301025, 2.9195046424865723, 3.077376365661621, 3.23524808883667, 3.3931198120117188, 3.5509915351867676, 3.7088630199432373, 3.866734743118286, 4.024606227874756, 4.182477951049805, 4.3403496742248535, 4.498221397399902, 4.656093120574951, 4.81396484375, 4.971836566925049, 5.129708290100098, 5.287579536437988, 5.445451259613037, 5.603322982788086, 5.761194705963135]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 2.0, 8.0, 9.0, 6.0, 14.0, 7.0, 8.0, 12.0, 13.0, 22.0, 18.0, 24.0, 28.0, 40.0, 57.0, 114.0, 138.0, 198.0, 318.0, 573.0, 1059.0, 2154.0, 6703.0, 45841.0, 4052735.0, 68540.0, 8644.0, 3020.0, 1545.0, 870.0, 554.0, 370.0, 210.0, 129.0, 92.0, 65.0, 44.0, 24.0, 20.0, 17.0, 15.0, 11.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.3250732421875, -2.261474609375, -2.1978759765625, -2.13427734375, -2.0706787109375, -2.007080078125, -1.9434814453125, -1.8798828125, -1.8162841796875, -1.752685546875, -1.6890869140625, -1.62548828125, -1.5618896484375, -1.498291015625, -1.4346923828125, -1.37109375, -1.3074951171875, -1.243896484375, -1.1802978515625, -1.11669921875, -1.0531005859375, -0.989501953125, -0.9259033203125, -0.8623046875, -0.7987060546875, -0.735107421875, -0.6715087890625, -0.60791015625, -0.5443115234375, -0.480712890625, -0.4171142578125, -0.353515625, -0.2899169921875, -0.226318359375, -0.1627197265625, -0.09912109375, -0.0355224609375, 0.028076171875, 0.0916748046875, 0.1552734375, 0.2188720703125, 0.282470703125, 0.3460693359375, 0.40966796875, 0.4732666015625, 0.536865234375, 0.6004638671875, 0.6640625, 0.7276611328125, 0.791259765625, 0.8548583984375, 0.91845703125, 0.9820556640625, 1.045654296875, 1.1092529296875, 1.1728515625, 1.2364501953125, 1.300048828125, 1.3636474609375, 1.42724609375, 1.4908447265625, 1.554443359375, 1.6180419921875, 1.681640625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 8.0, 18.0, 28.0, 58.0, 131.0, 248.0, 234.0, 114.0, 50.0, 25.0, 11.0, 9.0, 10.0, 11.0, 6.0, 5.0, 4.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1632080078125, -0.15892410278320312, -0.15464019775390625, -0.15035629272460938, -0.1460723876953125, -0.14178848266601562, -0.13750457763671875, -0.13322067260742188, -0.128936767578125, -0.12465286254882812, -0.12036895751953125, -0.11608505249023438, -0.1118011474609375, -0.10751724243164062, -0.10323333740234375, -0.09894943237304688, -0.09466552734375, -0.09038162231445312, -0.08609771728515625, -0.08181381225585938, -0.0775299072265625, -0.07324600219726562, -0.06896209716796875, -0.06467819213867188, -0.060394287109375, -0.056110382080078125, -0.05182647705078125, -0.047542572021484375, -0.0432586669921875, -0.038974761962890625, -0.03469085693359375, -0.030406951904296875, -0.026123046875, -0.021839141845703125, -0.01755523681640625, -0.013271331787109375, -0.0089874267578125, -0.004703521728515625, -0.00041961669921875, 0.003864288330078125, 0.008148193359375, 0.012432098388671875, 0.01671600341796875, 0.020999908447265625, 0.0252838134765625, 0.029567718505859375, 0.03385162353515625, 0.038135528564453125, 0.04241943359375, 0.046703338623046875, 0.05098724365234375, 0.055271148681640625, 0.0595550537109375, 0.06383895874023438, 0.06812286376953125, 0.07240676879882812, 0.076690673828125, 0.08097457885742188, 0.08525848388671875, 0.08954238891601562, 0.0938262939453125, 0.09811019897460938, 0.10239410400390625, 0.10667800903320312, 0.1109619140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 8.0, 20.0, 21.0, 42.0, 58.0, 149.0, 390.0, 1651.0, 12918.0, 3715095.0, 455434.0, 6872.0, 1037.0, 275.0, 90.0, 55.0, 34.0, 26.0, 18.0, 14.0, 6.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.58203125, -1.5272674560546875, -1.472503662109375, -1.4177398681640625, -1.36297607421875, -1.3082122802734375, -1.253448486328125, -1.1986846923828125, -1.1439208984375, -1.0891571044921875, -1.034393310546875, -0.9796295166015625, -0.92486572265625, -0.8701019287109375, -0.815338134765625, -0.7605743408203125, -0.705810546875, -0.6510467529296875, -0.596282958984375, -0.5415191650390625, -0.48675537109375, -0.4319915771484375, -0.377227783203125, -0.3224639892578125, -0.2677001953125, -0.2129364013671875, -0.158172607421875, -0.1034088134765625, -0.04864501953125, 0.0061187744140625, 0.060882568359375, 0.1156463623046875, 0.17041015625, 0.2251739501953125, 0.279937744140625, 0.3347015380859375, 0.38946533203125, 0.4442291259765625, 0.498992919921875, 0.5537567138671875, 0.6085205078125, 0.6632843017578125, 0.718048095703125, 0.7728118896484375, 0.82757568359375, 0.8823394775390625, 0.937103271484375, 0.9918670654296875, 1.046630859375, 1.1013946533203125, 1.156158447265625, 1.2109222412109375, 1.26568603515625, 1.3204498291015625, 1.375213623046875, 1.4299774169921875, 1.4847412109375, 1.5395050048828125, 1.594268798828125, 1.6490325927734375, 1.70379638671875, 1.7585601806640625, 1.813323974609375, 1.8680877685546875, 1.9228515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 19.0, 28.0, 27.0, 30.0, 52.0, 80.0, 147.0, 248.0, 524.0, 1424.0, 725.0, 294.0, 164.0, 96.0, 42.0, 28.0, 35.0, 15.0, 15.0, 8.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13720703125, -0.13335227966308594, -0.12949752807617188, -0.1256427764892578, -0.12178802490234375, -0.11793327331542969, -0.11407852172851562, -0.11022377014160156, -0.1063690185546875, -0.10251426696777344, -0.09865951538085938, -0.09480476379394531, -0.09095001220703125, -0.08709526062011719, -0.08324050903320312, -0.07938575744628906, -0.075531005859375, -0.07167625427246094, -0.06782150268554688, -0.06396675109863281, -0.06011199951171875, -0.05625724792480469, -0.052402496337890625, -0.04854774475097656, -0.0446929931640625, -0.04083824157714844, -0.036983489990234375, -0.03312873840332031, -0.02927398681640625, -0.025419235229492188, -0.021564483642578125, -0.017709732055664062, -0.01385498046875, -0.010000228881835938, -0.006145477294921875, -0.0022907257080078125, 0.00156402587890625, 0.0054187774658203125, 0.009273529052734375, 0.013128280639648438, 0.0169830322265625, 0.020837783813476562, 0.024692535400390625, 0.028547286987304688, 0.03240203857421875, 0.03625679016113281, 0.040111541748046875, 0.04396629333496094, 0.047821044921875, 0.05167579650878906, 0.055530548095703125, 0.05938529968261719, 0.06324005126953125, 0.06709480285644531, 0.07094955444335938, 0.07480430603027344, 0.0786590576171875, 0.08251380920410156, 0.08636856079101562, 0.09022331237792969, 0.09407806396484375, 0.09793281555175781, 0.10178756713867188, 0.10564231872558594, 0.1094970703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 11.0, 21.0, 100.0, 332.0, 404.0, 102.0, 22.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4085204601287842, -1.363159418106079, -1.317798376083374, -1.2724374532699585, -1.2270764112472534, -1.1817153692245483, -1.1363543272018433, -1.0909934043884277, -1.0456323623657227, -1.0002713203430176, -0.9549103379249573, -0.9095492959022522, -0.8641883134841919, -0.8188272714614868, -0.7734662294387817, -0.7281052470207214, -0.6827442049980164, -0.6373831629753113, -0.592022180557251, -0.5466611385345459, -0.5013001561164856, -0.4559391140937805, -0.4105781018733978, -0.36521708965301514, -0.31985607743263245, -0.27449506521224976, -0.22913405299186707, -0.18377302587032318, -0.1384120136499405, -0.0930510014295578, -0.047689974308013916, -0.0023289620876312256, 0.043032050132751465, 0.08839306235313416, 0.13375407457351685, 0.17911510169506073, 0.22447611391544342, 0.2698371410369873, 0.31519815325737, 0.3605591654777527, 0.4059201776981354, 0.45128118991851807, 0.49664220213890076, 0.5420032143592834, 0.5873642563819885, 0.6327252388000488, 0.6780862808227539, 0.723447322845459, 0.7688083052635193, 0.8141693472862244, 0.8595303297042847, 0.9048913717269897, 0.95025235414505, 0.9956133961677551, 1.0409743785858154, 1.0863354206085205, 1.1316964626312256, 1.1770575046539307, 1.2224185466766357, 1.2677794694900513, 1.3131405115127563, 1.3585015535354614, 1.4038625955581665, 1.449223518371582, 1.494584560394287]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 11.0, 19.0, 19.0, 41.0, 36.0, 28.0, 54.0, 55.0, 59.0, 62.0, 76.0, 69.0, 66.0, 63.0, 65.0, 58.0, 53.0, 28.0, 21.0, 25.0, 13.0, 14.0, 7.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.6968783736228943, -0.6789629459381104, -0.6610474586486816, -0.6431320309638977, -0.625216543674469, -0.6073011159896851, -0.5893856287002563, -0.5714702010154724, -0.5535547733306885, -0.5356393456459045, -0.5177238583564758, -0.4998084008693695, -0.4818929433822632, -0.46397751569747925, -0.4460620582103729, -0.4281466007232666, -0.4102311134338379, -0.39231565594673157, -0.37440019845962524, -0.3564847409725189, -0.3385692834854126, -0.32065385580062866, -0.30273839831352234, -0.284822940826416, -0.2669074833393097, -0.24899202585220337, -0.23107656836509705, -0.21316112577915192, -0.1952456682920456, -0.17733021080493927, -0.15941476821899414, -0.14149931073188782, -0.1235838532447815, -0.10566839575767517, -0.08775294572114944, -0.06983749568462372, -0.051922038197517395, -0.03400658071041107, -0.016091130673885345, 0.0018243193626403809, 0.019739776849746704, 0.03765523061156273, 0.055570684373378754, 0.07348613440990448, 0.0914015918970108, 0.10931704938411713, 0.12723249197006226, 0.14514794945716858, 0.1630634069442749, 0.18097886443138123, 0.19889432191848755, 0.21680976450443268, 0.234725221991539, 0.25264066457748413, 0.27055612206459045, 0.2884715795516968, 0.3063870370388031, 0.3243024945259094, 0.34221795201301575, 0.36013340950012207, 0.378048837184906, 0.3959643244743347, 0.41387975215911865, 0.431795209646225, 0.4497106671333313]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 14.0, 19.0, 30.0, 28.0, 51.0, 102.0, 169.0, 281.0, 522.0, 1119.0, 3155.0, 13213.0, 272523.0, 728066.0, 22177.0, 4185.0, 1431.0, 653.0, 316.0, 176.0, 113.0, 70.0, 39.0, 32.0, 13.0, 12.0, 3.0, 11.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9246444702148438, -0.8917694091796875, -0.8588943481445312, -0.826019287109375, -0.7931442260742188, -0.7602691650390625, -0.7273941040039062, -0.69451904296875, -0.6616439819335938, -0.6287689208984375, -0.5958938598632812, -0.563018798828125, -0.5301437377929688, -0.4972686767578125, -0.46439361572265625, -0.4315185546875, -0.39864349365234375, -0.3657684326171875, -0.33289337158203125, -0.300018310546875, -0.26714324951171875, -0.2342681884765625, -0.20139312744140625, -0.16851806640625, -0.13564300537109375, -0.1027679443359375, -0.06989288330078125, -0.037017822265625, -0.00414276123046875, 0.0287322998046875, 0.06160736083984375, 0.094482421875, 0.12735748291015625, 0.1602325439453125, 0.19310760498046875, 0.225982666015625, 0.25885772705078125, 0.2917327880859375, 0.32460784912109375, 0.35748291015625, 0.39035797119140625, 0.4232330322265625, 0.45610809326171875, 0.488983154296875, 0.5218582153320312, 0.5547332763671875, 0.5876083374023438, 0.6204833984375, 0.6533584594726562, 0.6862335205078125, 0.7191085815429688, 0.751983642578125, 0.7848587036132812, 0.8177337646484375, 0.8506088256835938, 0.88348388671875, 0.9163589477539062, 0.9492340087890625, 0.9821090698242188, 1.014984130859375, 1.0478591918945312, 1.0807342529296875, 1.1136093139648438, 1.146484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 11.0, 18.0, 52.0, 102.0, 191.0, 225.0, 176.0, 98.0, 49.0, 19.0, 15.0, 10.0, 6.0, 4.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15161991119384766, -0.1474781036376953, -0.14333629608154297, -0.13919448852539062, -0.13505268096923828, -0.13091087341308594, -0.1267690658569336, -0.12262725830078125, -0.1184854507446289, -0.11434364318847656, -0.11020183563232422, -0.10606002807617188, -0.10191822052001953, -0.09777641296386719, -0.09363460540771484, -0.0894927978515625, -0.08535099029541016, -0.08120918273925781, -0.07706737518310547, -0.07292556762695312, -0.06878376007080078, -0.06464195251464844, -0.060500144958496094, -0.05635833740234375, -0.052216529846191406, -0.04807472229003906, -0.04393291473388672, -0.039791107177734375, -0.03564929962158203, -0.03150749206542969, -0.027365684509277344, -0.023223876953125, -0.019082069396972656, -0.014940261840820312, -0.010798454284667969, -0.006656646728515625, -0.0025148391723632812, 0.0016269683837890625, 0.005768775939941406, 0.00991058349609375, 0.014052391052246094, 0.018194198608398438, 0.02233600616455078, 0.026477813720703125, 0.03061962127685547, 0.03476142883300781, 0.038903236389160156, 0.0430450439453125, 0.047186851501464844, 0.05132865905761719, 0.05547046661376953, 0.059612274169921875, 0.06375408172607422, 0.06789588928222656, 0.0720376968383789, 0.07617950439453125, 0.0803213119506836, 0.08446311950683594, 0.08860492706298828, 0.09274673461914062, 0.09688854217529297, 0.10103034973144531, 0.10517215728759766, 0.10931396484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 21.0, 17.0, 25.0, 40.0, 64.0, 87.0, 120.0, 183.0, 245.0, 463.0, 969.0, 2340.0, 6900.0, 26678.0, 151294.0, 621509.0, 192212.0, 32352.0, 7877.0, 2597.0, 1097.0, 514.0, 316.0, 202.0, 117.0, 89.0, 54.0, 46.0, 21.0, 28.0, 19.0, 8.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48779296875, -0.4723358154296875, -0.456878662109375, -0.4414215087890625, -0.42596435546875, -0.4105072021484375, -0.395050048828125, -0.3795928955078125, -0.3641357421875, -0.3486785888671875, -0.333221435546875, -0.3177642822265625, -0.30230712890625, -0.2868499755859375, -0.271392822265625, -0.2559356689453125, -0.240478515625, -0.2250213623046875, -0.209564208984375, -0.1941070556640625, -0.17864990234375, -0.1631927490234375, -0.147735595703125, -0.1322784423828125, -0.1168212890625, -0.1013641357421875, -0.085906982421875, -0.0704498291015625, -0.05499267578125, -0.0395355224609375, -0.024078369140625, -0.0086212158203125, 0.0068359375, 0.0222930908203125, 0.037750244140625, 0.0532073974609375, 0.06866455078125, 0.0841217041015625, 0.099578857421875, 0.1150360107421875, 0.1304931640625, 0.1459503173828125, 0.161407470703125, 0.1768646240234375, 0.19232177734375, 0.2077789306640625, 0.223236083984375, 0.2386932373046875, 0.254150390625, 0.2696075439453125, 0.285064697265625, 0.3005218505859375, 0.31597900390625, 0.3314361572265625, 0.346893310546875, 0.3623504638671875, 0.3778076171875, 0.3932647705078125, 0.408721923828125, 0.4241790771484375, 0.43963623046875, 0.4550933837890625, 0.470550537109375, 0.4860076904296875, 0.50146484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 10.0, 10.0, 8.0, 13.0, 18.0, 15.0, 20.0, 19.0, 27.0, 41.0, 39.0, 33.0, 46.0, 63.0, 54.0, 48.0, 54.0, 52.0, 61.0, 50.0, 42.0, 42.0, 37.0, 32.0, 25.0, 27.0, 17.0, 23.0, 8.0, 13.0, 11.0, 7.0, 6.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33544921875, -0.324310302734375, -0.31317138671875, -0.302032470703125, -0.2908935546875, -0.279754638671875, -0.26861572265625, -0.257476806640625, -0.246337890625, -0.235198974609375, -0.22406005859375, -0.212921142578125, -0.2017822265625, -0.190643310546875, -0.17950439453125, -0.168365478515625, -0.1572265625, -0.146087646484375, -0.13494873046875, -0.123809814453125, -0.1126708984375, -0.101531982421875, -0.09039306640625, -0.079254150390625, -0.068115234375, -0.056976318359375, -0.04583740234375, -0.034698486328125, -0.0235595703125, -0.012420654296875, -0.00128173828125, 0.009857177734375, 0.02099609375, 0.032135009765625, 0.04327392578125, 0.054412841796875, 0.0655517578125, 0.076690673828125, 0.08782958984375, 0.098968505859375, 0.110107421875, 0.121246337890625, 0.13238525390625, 0.143524169921875, 0.1546630859375, 0.165802001953125, 0.17694091796875, 0.188079833984375, 0.19921875, 0.210357666015625, 0.22149658203125, 0.232635498046875, 0.2437744140625, 0.254913330078125, 0.26605224609375, 0.277191162109375, 0.288330078125, 0.299468994140625, 0.31060791015625, 0.321746826171875, 0.3328857421875, 0.344024658203125, 0.35516357421875, 0.366302490234375, 0.37744140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 12.0, 23.0, 31.0, 46.0, 87.0, 114.0, 205.0, 489.0, 1186.0, 4336.0, 23151.0, 259922.0, 681340.0, 65290.0, 8715.0, 2122.0, 716.0, 311.0, 156.0, 105.0, 57.0, 40.0, 23.0, 19.0, 11.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.32488250732421875, -0.3148040771484375, -0.30472564697265625, -0.294647216796875, -0.28456878662109375, -0.2744903564453125, -0.26441192626953125, -0.25433349609375, -0.24425506591796875, -0.2341766357421875, -0.22409820556640625, -0.214019775390625, -0.20394134521484375, -0.1938629150390625, -0.18378448486328125, -0.1737060546875, -0.16362762451171875, -0.1535491943359375, -0.14347076416015625, -0.133392333984375, -0.12331390380859375, -0.1132354736328125, -0.10315704345703125, -0.09307861328125, -0.08300018310546875, -0.0729217529296875, -0.06284332275390625, -0.052764892578125, -0.04268646240234375, -0.0326080322265625, -0.02252960205078125, -0.012451171875, -0.00237274169921875, 0.0077056884765625, 0.01778411865234375, 0.027862548828125, 0.03794097900390625, 0.0480194091796875, 0.05809783935546875, 0.06817626953125, 0.07825469970703125, 0.0883331298828125, 0.09841156005859375, 0.108489990234375, 0.11856842041015625, 0.1286468505859375, 0.13872528076171875, 0.1488037109375, 0.15888214111328125, 0.1689605712890625, 0.17903900146484375, 0.189117431640625, 0.19919586181640625, 0.2092742919921875, 0.21935272216796875, 0.22943115234375, 0.23950958251953125, 0.2495880126953125, 0.25966644287109375, 0.269744873046875, 0.27982330322265625, 0.2899017333984375, 0.29998016357421875, 0.31005859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 5.0, 15.0, 15.0, 14.0, 32.0, 50.0, 50.0, 74.0, 134.0, 176.0, 140.0, 84.0, 55.0, 31.0, 35.0, 23.0, 24.0, 14.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002474784851074219, -0.00024164840579032898, -0.00023581832647323608, -0.0002299882471561432, -0.0002241581678390503, -0.0002183280885219574, -0.0002124980092048645, -0.0002066679298877716, -0.0002008378505706787, -0.00019500777125358582, -0.00018917769193649292, -0.00018334761261940002, -0.00017751753330230713, -0.00017168745398521423, -0.00016585737466812134, -0.00016002729535102844, -0.00015419721603393555, -0.00014836713671684265, -0.00014253705739974976, -0.00013670697808265686, -0.00013087689876556396, -0.00012504681944847107, -0.00011921674013137817, -0.00011338666081428528, -0.00010755658149719238, -0.00010172650218009949, -9.589642286300659e-05, -9.00663435459137e-05, -8.42362642288208e-05, -7.84061849117279e-05, -7.257610559463501e-05, -6.674602627754211e-05, -6.091594696044922e-05, -5.508586764335632e-05, -4.925578832626343e-05, -4.342570900917053e-05, -3.759562969207764e-05, -3.176555037498474e-05, -2.5935471057891846e-05, -2.010539174079895e-05, -1.4275312423706055e-05, -8.44523310661316e-06, -2.6151537895202637e-06, 3.214925527572632e-06, 9.045004844665527e-06, 1.4875084161758423e-05, 2.070516347885132e-05, 2.6535242795944214e-05, 3.236532211303711e-05, 3.8195401430130005e-05, 4.40254807472229e-05, 4.9855560064315796e-05, 5.568563938140869e-05, 6.151571869850159e-05, 6.734579801559448e-05, 7.317587733268738e-05, 7.900595664978027e-05, 8.483603596687317e-05, 9.066611528396606e-05, 9.649619460105896e-05, 0.00010232627391815186, 0.00010815635323524475, 0.00011398643255233765, 0.00011981651186943054, 0.00012564659118652344]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 1.0, 5.0, 7.0, 7.0, 14.0, 22.0, 26.0, 26.0, 35.0, 59.0, 73.0, 151.0, 235.0, 533.0, 1125.0, 3319.0, 13766.0, 92129.0, 688381.0, 215200.0, 25504.0, 5009.0, 1522.0, 600.0, 329.0, 155.0, 90.0, 66.0, 46.0, 25.0, 14.0, 18.0, 16.0, 12.0, 7.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33154296875, -0.3222503662109375, -0.312957763671875, -0.3036651611328125, -0.29437255859375, -0.2850799560546875, -0.275787353515625, -0.2664947509765625, -0.2572021484375, -0.2479095458984375, -0.238616943359375, -0.2293243408203125, -0.22003173828125, -0.2107391357421875, -0.201446533203125, -0.1921539306640625, -0.182861328125, -0.1735687255859375, -0.164276123046875, -0.1549835205078125, -0.14569091796875, -0.1363983154296875, -0.127105712890625, -0.1178131103515625, -0.1085205078125, -0.0992279052734375, -0.089935302734375, -0.0806427001953125, -0.07135009765625, -0.0620574951171875, -0.052764892578125, -0.0434722900390625, -0.0341796875, -0.0248870849609375, -0.015594482421875, -0.0063018798828125, 0.00299072265625, 0.0122833251953125, 0.021575927734375, 0.0308685302734375, 0.0401611328125, 0.0494537353515625, 0.058746337890625, 0.0680389404296875, 0.07733154296875, 0.0866241455078125, 0.095916748046875, 0.1052093505859375, 0.114501953125, 0.1237945556640625, 0.133087158203125, 0.1423797607421875, 0.15167236328125, 0.1609649658203125, 0.170257568359375, 0.1795501708984375, 0.1888427734375, 0.1981353759765625, 0.207427978515625, 0.2167205810546875, 0.22601318359375, 0.2353057861328125, 0.244598388671875, 0.2538909912109375, 0.26318359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 5.0, 13.0, 5.0, 9.0, 26.0, 33.0, 32.0, 42.0, 63.0, 66.0, 82.0, 97.0, 79.0, 93.0, 58.0, 70.0, 43.0, 43.0, 25.0, 27.0, 18.0, 12.0, 11.0, 7.0, 12.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.16072750091552734, -0.1564159393310547, -0.15210437774658203, -0.14779281616210938, -0.14348125457763672, -0.13916969299316406, -0.1348581314086914, -0.13054656982421875, -0.1262350082397461, -0.12192344665527344, -0.11761188507080078, -0.11330032348632812, -0.10898876190185547, -0.10467720031738281, -0.10036563873291016, -0.0960540771484375, -0.09174251556396484, -0.08743095397949219, -0.08311939239501953, -0.07880783081054688, -0.07449626922607422, -0.07018470764160156, -0.0658731460571289, -0.06156158447265625, -0.057250022888183594, -0.05293846130371094, -0.04862689971923828, -0.044315338134765625, -0.04000377655029297, -0.03569221496582031, -0.031380653381347656, -0.027069091796875, -0.022757530212402344, -0.018445968627929688, -0.014134407043457031, -0.009822845458984375, -0.005511283874511719, -0.0011997222900390625, 0.0031118392944335938, 0.00742340087890625, 0.011734962463378906, 0.016046524047851562, 0.02035808563232422, 0.024669647216796875, 0.02898120880126953, 0.03329277038574219, 0.037604331970214844, 0.0419158935546875, 0.046227455139160156, 0.05053901672363281, 0.05485057830810547, 0.059162139892578125, 0.06347370147705078, 0.06778526306152344, 0.0720968246459961, 0.07640838623046875, 0.0807199478149414, 0.08503150939941406, 0.08934307098388672, 0.09365463256835938, 0.09796619415283203, 0.10227775573730469, 0.10658931732177734, 0.11090087890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 6.0, 17.0, 32.0, 86.0, 286.0, 372.0, 137.0, 44.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6822969913482666, -3.4905805587768555, -3.2988638877868652, -3.107147216796875, -2.915430784225464, -2.7237143516540527, -2.5319976806640625, -2.3402810096740723, -2.148564577102661, -1.9568480253219604, -1.7651314735412598, -1.573414921760559, -1.3816983699798584, -1.1899818181991577, -0.998265266418457, -0.8065487146377563, -0.6148321628570557, -0.423115611076355, -0.2313990592956543, -0.03968250751495361, 0.15203404426574707, 0.34375059604644775, 0.5354671478271484, 0.7271836996078491, 0.9189002513885498, 1.1106168031692505, 1.3023333549499512, 1.4940499067306519, 1.6857664585113525, 1.8774830102920532, 2.069199562072754, 2.260916233062744, 2.4526329040527344, 2.6443495750427246, 2.8360660076141357, 3.027782440185547, 3.219499111175537, 3.4112157821655273, 3.6029322147369385, 3.7946486473083496, 3.98636531829834, 4.17808198928833, 4.36979866027832, 4.561514854431152, 4.753231525421143, 4.944948196411133, 5.136664390563965, 5.328381061553955, 5.520097732543945, 5.7118144035339355, 5.903531074523926, 6.095247268676758, 6.286963939666748, 6.478680610656738, 6.67039680480957, 6.8621134757995605, 7.053830146789551, 7.245546817779541, 7.437263488769531, 7.628979682922363, 7.8206963539123535, 8.012413024902344, 8.204129219055176, 8.395846366882324, 8.587562561035156]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 13.0, 17.0, 16.0, 22.0, 20.0, 30.0, 38.0, 46.0, 41.0, 49.0, 46.0, 49.0, 64.0, 68.0, 79.0, 39.0, 52.0, 58.0, 53.0, 41.0, 23.0, 26.0, 26.0, 20.0, 10.0, 11.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6003174781799316, -2.4959962368011475, -2.3916749954223633, -2.287353992462158, -2.183032751083374, -2.07871150970459, -1.9743902683258057, -1.8700690269470215, -1.7657477855682373, -1.6614265441894531, -1.5571054220199585, -1.4527841806411743, -1.3484629392623901, -1.2441418170928955, -1.1398205757141113, -1.0354993343353271, -0.9311782121658325, -0.8268570303916931, -0.7225357890129089, -0.6182146072387695, -0.5138933658599854, -0.40957218408584595, -0.30525100231170654, -0.20092976093292236, -0.09660857915878296, 0.007712624967098236, 0.11203382909297943, 0.21635502576828003, 0.3206762373447418, 0.4249974489212036, 0.529318630695343, 0.6336398720741272, 0.7379610538482666, 0.842282235622406, 0.9466034770011902, 1.0509246587753296, 1.1552459001541138, 1.2595670223236084, 1.3638882637023926, 1.4682095050811768, 1.572530746459961, 1.6768519878387451, 1.7811731100082397, 1.885494351387024, 1.989815592765808, 2.0941367149353027, 2.198457956314087, 2.302779197692871, 2.407100200653076, 2.5114214420318604, 2.6157426834106445, 2.7200636863708496, 2.824384927749634, 2.928706169128418, 3.033027410507202, 3.1373486518859863, 3.2416698932647705, 3.3459911346435547, 3.450312376022339, 3.554633617401123, 3.658954620361328, 3.7632758617401123, 3.8675971031188965, 3.9719183444976807, 4.076239585876465]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 22.0, 23.0, 42.0, 87.0, 182.0, 572.0, 4551.0, 4148468.0, 38198.0, 1498.0, 359.0, 119.0, 70.0, 34.0, 18.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.559326171875, -5.40380859375, -5.248291015625, -5.0927734375, -4.937255859375, -4.78173828125, -4.626220703125, -4.470703125, -4.315185546875, -4.15966796875, -4.004150390625, -3.8486328125, -3.693115234375, -3.53759765625, -3.382080078125, -3.2265625, -3.071044921875, -2.91552734375, -2.760009765625, -2.6044921875, -2.448974609375, -2.29345703125, -2.137939453125, -1.982421875, -1.826904296875, -1.67138671875, -1.515869140625, -1.3603515625, -1.204833984375, -1.04931640625, -0.893798828125, -0.73828125, -0.582763671875, -0.42724609375, -0.271728515625, -0.1162109375, 0.039306640625, 0.19482421875, 0.350341796875, 0.505859375, 0.661376953125, 0.81689453125, 0.972412109375, 1.1279296875, 1.283447265625, 1.43896484375, 1.594482421875, 1.75, 1.905517578125, 2.06103515625, 2.216552734375, 2.3720703125, 2.527587890625, 2.68310546875, 2.838623046875, 2.994140625, 3.149658203125, 3.30517578125, 3.460693359375, 3.6162109375, 3.771728515625, 3.92724609375, 4.082763671875, 4.23828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 17.0, 19.0, 36.0, 76.0, 109.0, 159.0, 161.0, 145.0, 107.0, 62.0, 43.0, 21.0, 19.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1905517578125, -0.1853351593017578, -0.18011856079101562, -0.17490196228027344, -0.16968536376953125, -0.16446876525878906, -0.15925216674804688, -0.1540355682373047, -0.1488189697265625, -0.1436023712158203, -0.13838577270507812, -0.13316917419433594, -0.12795257568359375, -0.12273597717285156, -0.11751937866210938, -0.11230278015136719, -0.107086181640625, -0.10186958312988281, -0.09665298461914062, -0.09143638610839844, -0.08621978759765625, -0.08100318908691406, -0.07578659057617188, -0.07056999206542969, -0.0653533935546875, -0.06013679504394531, -0.054920196533203125, -0.04970359802246094, -0.04448699951171875, -0.03927040100097656, -0.034053802490234375, -0.028837203979492188, -0.02362060546875, -0.018404006958007812, -0.013187408447265625, -0.007970809936523438, -0.00275421142578125, 0.0024623870849609375, 0.007678985595703125, 0.012895584106445312, 0.0181121826171875, 0.023328781127929688, 0.028545379638671875, 0.03376197814941406, 0.03897857666015625, 0.04419517517089844, 0.049411773681640625, 0.05462837219238281, 0.059844970703125, 0.06506156921386719, 0.07027816772460938, 0.07549476623535156, 0.08071136474609375, 0.08592796325683594, 0.09114456176757812, 0.09636116027832031, 0.1015777587890625, 0.10679435729980469, 0.11201095581054688, 0.11722755432128906, 0.12244415283203125, 0.12766075134277344, 0.13287734985351562, 0.1380939483642578, 0.143310546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 11.0, 17.0, 15.0, 11.0, 31.0, 41.0, 65.0, 88.0, 172.0, 320.0, 632.0, 2021.0, 8724.0, 84710.0, 3814387.0, 261276.0, 17020.0, 3038.0, 890.0, 384.0, 176.0, 98.0, 58.0, 36.0, 18.0, 13.0, 9.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.775390625, -0.7492446899414062, -0.7230987548828125, -0.6969528198242188, -0.670806884765625, -0.6446609497070312, -0.6185150146484375, -0.5923690795898438, -0.56622314453125, -0.5400772094726562, -0.5139312744140625, -0.48778533935546875, -0.461639404296875, -0.43549346923828125, -0.4093475341796875, -0.38320159912109375, -0.3570556640625, -0.33090972900390625, -0.3047637939453125, -0.27861785888671875, -0.252471923828125, -0.22632598876953125, -0.2001800537109375, -0.17403411865234375, -0.14788818359375, -0.12174224853515625, -0.0955963134765625, -0.06945037841796875, -0.043304443359375, -0.01715850830078125, 0.0089874267578125, 0.03513336181640625, 0.061279296875, 0.08742523193359375, 0.1135711669921875, 0.13971710205078125, 0.165863037109375, 0.19200897216796875, 0.2181549072265625, 0.24430084228515625, 0.27044677734375, 0.29659271240234375, 0.3227386474609375, 0.34888458251953125, 0.375030517578125, 0.40117645263671875, 0.4273223876953125, 0.45346832275390625, 0.4796142578125, 0.5057601928710938, 0.5319061279296875, 0.5580520629882812, 0.584197998046875, 0.6103439331054688, 0.6364898681640625, 0.6626358032226562, 0.68878173828125, 0.7149276733398438, 0.7410736083984375, 0.7672195434570312, 0.793365478515625, 0.8195114135742188, 0.8456573486328125, 0.8718032836914062, 0.89794921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 11.0, 18.0, 40.0, 56.0, 94.0, 167.0, 364.0, 1141.0, 1254.0, 431.0, 189.0, 95.0, 62.0, 37.0, 30.0, 18.0, 13.0, 15.0, 5.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.2185192108154297, -0.21291732788085938, -0.20731544494628906, -0.20171356201171875, -0.19611167907714844, -0.19050979614257812, -0.1849079132080078, -0.1793060302734375, -0.1737041473388672, -0.16810226440429688, -0.16250038146972656, -0.15689849853515625, -0.15129661560058594, -0.14569473266601562, -0.1400928497314453, -0.134490966796875, -0.1288890838623047, -0.12328720092773438, -0.11768531799316406, -0.11208343505859375, -0.10648155212402344, -0.10087966918945312, -0.09527778625488281, -0.0896759033203125, -0.08407402038574219, -0.07847213745117188, -0.07287025451660156, -0.06726837158203125, -0.06166648864746094, -0.056064605712890625, -0.05046272277832031, -0.04486083984375, -0.03925895690917969, -0.033657073974609375, -0.028055191040039062, -0.02245330810546875, -0.016851425170898438, -0.011249542236328125, -0.0056476593017578125, -4.57763671875e-05, 0.0055561065673828125, 0.011157989501953125, 0.016759872436523438, 0.02236175537109375, 0.027963638305664062, 0.033565521240234375, 0.03916740417480469, 0.044769287109375, 0.05037117004394531, 0.055973052978515625, 0.06157493591308594, 0.06717681884765625, 0.07277870178222656, 0.07838058471679688, 0.08398246765136719, 0.0895843505859375, 0.09518623352050781, 0.10078811645507812, 0.10638999938964844, 0.11199188232421875, 0.11759376525878906, 0.12319564819335938, 0.1287975311279297, 0.1343994140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 33.0, 117.0, 303.0, 340.0, 134.0, 35.0, 10.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0341618061065674, -1.988869547843933, -1.9435774087905884, -1.898285150527954, -1.8529930114746094, -1.807700753211975, -1.7624086141586304, -1.717116355895996, -1.6718242168426514, -1.626531958580017, -1.5812398195266724, -1.535947561264038, -1.4906554222106934, -1.445363163948059, -1.4000710248947144, -1.35477876663208, -1.3094866275787354, -1.264194369316101, -1.2189022302627563, -1.173609972000122, -1.1283178329467773, -1.083025574684143, -1.0377334356307983, -0.9924411773681641, -0.9471489191055298, -0.9018567204475403, -0.8565645217895508, -0.8112723231315613, -0.7659801244735718, -0.7206879258155823, -0.6753957271575928, -0.6301034688949585, -0.5848113298416138, -0.5395191311836243, -0.49422693252563477, -0.44893473386764526, -0.40364253520965576, -0.35835033655166626, -0.31305810809135437, -0.26776590943336487, -0.22247371077537537, -0.17718151211738586, -0.13188931345939636, -0.08659709990024567, -0.041304901242256165, 0.003987297415733337, 0.04927951097488403, 0.09457170963287354, 0.13986390829086304, 0.18515610694885254, 0.23044830560684204, 0.27574050426483154, 0.32103270292282104, 0.36632490158081055, 0.41161713004112244, 0.45690932869911194, 0.5022015571594238, 0.5474937558174133, 0.5927859544754028, 0.6380781531333923, 0.6833703517913818, 0.7286625504493713, 0.7739547491073608, 0.8192470073699951, 0.8645391464233398]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 10.0, 11.0, 28.0, 16.0, 22.0, 41.0, 42.0, 34.0, 34.0, 45.0, 48.0, 49.0, 51.0, 49.0, 60.0, 57.0, 54.0, 55.0, 38.0, 44.0, 29.0, 31.0, 21.0, 21.0, 19.0, 12.0, 14.0, 12.0, 9.0, 1.0, 7.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5313940644264221, -0.5143440961837769, -0.4972941279411316, -0.4802441895008087, -0.46319422125816345, -0.4461442530155182, -0.4290943145751953, -0.41204434633255005, -0.3949943780899048, -0.3779444098472595, -0.36089444160461426, -0.3438445031642914, -0.3267945349216461, -0.30974456667900085, -0.292694628238678, -0.2756446599960327, -0.25859469175338745, -0.2415447235107422, -0.22449477016925812, -0.20744481682777405, -0.19039484858512878, -0.17334488034248352, -0.15629492700099945, -0.13924497365951538, -0.12219500541687012, -0.10514504462480545, -0.08809508383274078, -0.07104512304067612, -0.05399516224861145, -0.03694520145654678, -0.019895240664482117, -0.00284527987241745, 0.014204680919647217, 0.031254641711711884, 0.04830460250377655, 0.06535456329584122, 0.08240452408790588, 0.09945448487997055, 0.11650444567203522, 0.1335543990135193, 0.15060436725616455, 0.16765433549880981, 0.18470428884029388, 0.20175424218177795, 0.21880421042442322, 0.23585417866706848, 0.25290411710739136, 0.2699540853500366, 0.2870040535926819, 0.30405402183532715, 0.3211039900779724, 0.3381539285182953, 0.35520389676094055, 0.3722538650035858, 0.3893038034439087, 0.40635377168655396, 0.4234037399291992, 0.4404537081718445, 0.45750367641448975, 0.4745536148548126, 0.4916035830974579, 0.5086535215377808, 0.525703489780426, 0.5427534580230713, 0.5598034262657166]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 12.0, 17.0, 25.0, 39.0, 72.0, 144.0, 209.0, 439.0, 1016.0, 2747.0, 12341.0, 316963.0, 687017.0, 21328.0, 3704.0, 1293.0, 566.0, 259.0, 116.0, 78.0, 54.0, 25.0, 25.0, 11.0, 11.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.094818115234375, -1.06072998046875, -1.026641845703125, -0.9925537109375, -0.958465576171875, -0.92437744140625, -0.890289306640625, -0.856201171875, -0.822113037109375, -0.78802490234375, -0.753936767578125, -0.7198486328125, -0.685760498046875, -0.65167236328125, -0.617584228515625, -0.58349609375, -0.549407958984375, -0.51531982421875, -0.481231689453125, -0.4471435546875, -0.413055419921875, -0.37896728515625, -0.344879150390625, -0.310791015625, -0.276702880859375, -0.24261474609375, -0.208526611328125, -0.1744384765625, -0.140350341796875, -0.10626220703125, -0.072174072265625, -0.0380859375, -0.003997802734375, 0.03009033203125, 0.064178466796875, 0.0982666015625, 0.132354736328125, 0.16644287109375, 0.200531005859375, 0.234619140625, 0.268707275390625, 0.30279541015625, 0.336883544921875, 0.3709716796875, 0.405059814453125, 0.43914794921875, 0.473236083984375, 0.50732421875, 0.541412353515625, 0.57550048828125, 0.609588623046875, 0.6436767578125, 0.677764892578125, 0.71185302734375, 0.745941162109375, 0.780029296875, 0.814117431640625, 0.84820556640625, 0.882293701171875, 0.9163818359375, 0.950469970703125, 0.98455810546875, 1.018646240234375, 1.052734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 18.0, 39.0, 77.0, 104.0, 147.0, 193.0, 141.0, 106.0, 68.0, 40.0, 30.0, 10.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.191162109375, -0.18593978881835938, -0.18071746826171875, -0.17549514770507812, -0.1702728271484375, -0.16505050659179688, -0.15982818603515625, -0.15460586547851562, -0.149383544921875, -0.14416122436523438, -0.13893890380859375, -0.13371658325195312, -0.1284942626953125, -0.12327194213867188, -0.11804962158203125, -0.11282730102539062, -0.10760498046875, -0.10238265991210938, -0.09716033935546875, -0.09193801879882812, -0.0867156982421875, -0.08149337768554688, -0.07627105712890625, -0.07104873657226562, -0.065826416015625, -0.060604095458984375, -0.05538177490234375, -0.050159454345703125, -0.0449371337890625, -0.039714813232421875, -0.03449249267578125, -0.029270172119140625, -0.0240478515625, -0.018825531005859375, -0.01360321044921875, -0.008380889892578125, -0.0031585693359375, 0.002063751220703125, 0.00728607177734375, 0.012508392333984375, 0.017730712890625, 0.022953033447265625, 0.02817535400390625, 0.033397674560546875, 0.0386199951171875, 0.043842315673828125, 0.04906463623046875, 0.054286956787109375, 0.05950927734375, 0.06473159790039062, 0.06995391845703125, 0.07517623901367188, 0.0803985595703125, 0.08562088012695312, 0.09084320068359375, 0.09606552124023438, 0.101287841796875, 0.10651016235351562, 0.11173248291015625, 0.11695480346679688, 0.1221771240234375, 0.12739944458007812, 0.13262176513671875, 0.13784408569335938, 0.14306640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 13.0, 11.0, 13.0, 22.0, 28.0, 46.0, 75.0, 135.0, 165.0, 292.0, 519.0, 1021.0, 2325.0, 6574.0, 22683.0, 108009.0, 539969.0, 297058.0, 49870.0, 12417.0, 3958.0, 1530.0, 761.0, 378.0, 234.0, 133.0, 87.0, 78.0, 51.0, 33.0, 24.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4049415588378906, -0.38922882080078125, -0.3735160827636719, -0.3578033447265625, -0.3420906066894531, -0.32637786865234375, -0.3106651306152344, -0.294952392578125, -0.2792396545410156, -0.26352691650390625, -0.24781417846679688, -0.2321014404296875, -0.21638870239257812, -0.20067596435546875, -0.18496322631835938, -0.16925048828125, -0.15353775024414062, -0.13782501220703125, -0.12211227416992188, -0.1063995361328125, -0.09068679809570312, -0.07497406005859375, -0.059261322021484375, -0.043548583984375, -0.027835845947265625, -0.01212310791015625, 0.003589630126953125, 0.0193023681640625, 0.035015106201171875, 0.05072784423828125, 0.06644058227539062, 0.0821533203125, 0.09786605834960938, 0.11357879638671875, 0.12929153442382812, 0.1450042724609375, 0.16071701049804688, 0.17642974853515625, 0.19214248657226562, 0.207855224609375, 0.22356796264648438, 0.23928070068359375, 0.2549934387207031, 0.2707061767578125, 0.2864189147949219, 0.30213165283203125, 0.3178443908691406, 0.33355712890625, 0.3492698669433594, 0.36498260498046875, 0.3806953430175781, 0.3964080810546875, 0.4121208190917969, 0.42783355712890625, 0.4435462951660156, 0.459259033203125, 0.4749717712402344, 0.49068450927734375, 0.5063972473144531, 0.5221099853515625, 0.5378227233886719, 0.5535354614257812, 0.5692481994628906, 0.5849609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 15.0, 20.0, 13.0, 24.0, 23.0, 35.0, 39.0, 53.0, 42.0, 57.0, 51.0, 70.0, 66.0, 66.0, 51.0, 62.0, 59.0, 41.0, 47.0, 28.0, 25.0, 19.0, 19.0, 12.0, 15.0, 14.0, 9.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423828125, -0.40727996826171875, -0.3907318115234375, -0.37418365478515625, -0.357635498046875, -0.34108734130859375, -0.3245391845703125, -0.30799102783203125, -0.29144287109375, -0.27489471435546875, -0.2583465576171875, -0.24179840087890625, -0.225250244140625, -0.20870208740234375, -0.1921539306640625, -0.17560577392578125, -0.1590576171875, -0.14250946044921875, -0.1259613037109375, -0.10941314697265625, -0.092864990234375, -0.07631683349609375, -0.0597686767578125, -0.04322052001953125, -0.02667236328125, -0.01012420654296875, 0.0064239501953125, 0.02297210693359375, 0.039520263671875, 0.05606842041015625, 0.0726165771484375, 0.08916473388671875, 0.105712890625, 0.12226104736328125, 0.1388092041015625, 0.15535736083984375, 0.171905517578125, 0.18845367431640625, 0.2050018310546875, 0.22154998779296875, 0.23809814453125, 0.25464630126953125, 0.2711944580078125, 0.28774261474609375, 0.304290771484375, 0.32083892822265625, 0.3373870849609375, 0.35393524169921875, 0.3704833984375, 0.38703155517578125, 0.4035797119140625, 0.42012786865234375, 0.436676025390625, 0.45322418212890625, 0.4697723388671875, 0.48632049560546875, 0.50286865234375, 0.5194168090820312, 0.5359649658203125, 0.5525131225585938, 0.569061279296875, 0.5856094360351562, 0.6021575927734375, 0.6187057495117188, 0.63525390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 13.0, 17.0, 22.0, 43.0, 59.0, 122.0, 325.0, 965.0, 4850.0, 73843.0, 813265.0, 145028.0, 7971.0, 1312.0, 373.0, 167.0, 73.0, 35.0, 24.0, 15.0, 8.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3955078125, -0.3849906921386719, -0.37447357177734375, -0.3639564514160156, -0.3534393310546875, -0.3429222106933594, -0.33240509033203125, -0.3218879699707031, -0.311370849609375, -0.3008537292480469, -0.29033660888671875, -0.2798194885253906, -0.2693023681640625, -0.2587852478027344, -0.24826812744140625, -0.23775100708007812, -0.22723388671875, -0.21671676635742188, -0.20619964599609375, -0.19568252563476562, -0.1851654052734375, -0.17464828491210938, -0.16413116455078125, -0.15361404418945312, -0.143096923828125, -0.13257980346679688, -0.12206268310546875, -0.11154556274414062, -0.1010284423828125, -0.09051132202148438, -0.07999420166015625, -0.06947708129882812, -0.0589599609375, -0.048442840576171875, -0.03792572021484375, -0.027408599853515625, -0.0168914794921875, -0.006374359130859375, 0.00414276123046875, 0.014659881591796875, 0.025177001953125, 0.035694122314453125, 0.04621124267578125, 0.056728363037109375, 0.0672454833984375, 0.07776260375976562, 0.08827972412109375, 0.09879684448242188, 0.10931396484375, 0.11983108520507812, 0.13034820556640625, 0.14086532592773438, 0.1513824462890625, 0.16189956665039062, 0.17241668701171875, 0.18293380737304688, 0.193450927734375, 0.20396804809570312, 0.21448516845703125, 0.22500228881835938, 0.2355194091796875, 0.24603652954101562, 0.25655364990234375, 0.2670707702636719, 0.277587890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 13.0, 7.0, 16.0, 14.0, 19.0, 20.0, 39.0, 37.0, 53.0, 84.0, 180.0, 170.0, 118.0, 59.0, 40.0, 34.0, 27.0, 13.0, 19.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011676549911499023, -0.00011171307414770126, -0.00010666064918041229, -0.00010160822421312332, -9.655579924583435e-05, -9.150337427854538e-05, -8.645094931125641e-05, -8.139852434396744e-05, -7.634609937667847e-05, -7.12936744093895e-05, -6.624124944210052e-05, -6.118882447481155e-05, -5.613639950752258e-05, -5.108397454023361e-05, -4.603154957294464e-05, -4.097912460565567e-05, -3.59266996383667e-05, -3.087427467107773e-05, -2.5821849703788757e-05, -2.0769424736499786e-05, -1.5716999769210815e-05, -1.0664574801921844e-05, -5.6121498346328735e-06, -5.597248673439026e-07, 4.492700099945068e-06, 9.54512506723404e-06, 1.459755003452301e-05, 1.964997500181198e-05, 2.4702399969100952e-05, 2.9754824936389923e-05, 3.4807249903678894e-05, 3.9859674870967865e-05, 4.4912099838256836e-05, 4.996452480554581e-05, 5.501694977283478e-05, 6.006937474012375e-05, 6.512179970741272e-05, 7.017422467470169e-05, 7.522664964199066e-05, 8.027907460927963e-05, 8.53314995765686e-05, 9.038392454385757e-05, 9.543634951114655e-05, 0.00010048877447843552, 0.00010554119944572449, 0.00011059362441301346, 0.00011564604938030243, 0.0001206984743475914, 0.00012575089931488037, 0.00013080332428216934, 0.0001358557492494583, 0.00014090817421674728, 0.00014596059918403625, 0.00015101302415132523, 0.0001560654491186142, 0.00016111787408590317, 0.00016617029905319214, 0.0001712227240204811, 0.00017627514898777008, 0.00018132757395505905, 0.00018637999892234802, 0.000191432423889637, 0.00019648484885692596, 0.00020153727382421494, 0.0002065896987915039]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 7.0, 6.0, 18.0, 20.0, 40.0, 33.0, 53.0, 67.0, 117.0, 161.0, 280.0, 462.0, 925.0, 2056.0, 5391.0, 19134.0, 91749.0, 444680.0, 381367.0, 76843.0, 16530.0, 4798.0, 1775.0, 797.0, 430.0, 263.0, 201.0, 90.0, 73.0, 45.0, 33.0, 19.0, 18.0, 14.0, 11.0, 7.0, 3.0, 3.0, 5.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1976318359375, -0.1916332244873047, -0.18563461303710938, -0.17963600158691406, -0.17363739013671875, -0.16763877868652344, -0.16164016723632812, -0.1556415557861328, -0.1496429443359375, -0.1436443328857422, -0.13764572143554688, -0.13164710998535156, -0.12564849853515625, -0.11964988708496094, -0.11365127563476562, -0.10765266418457031, -0.101654052734375, -0.09565544128417969, -0.08965682983398438, -0.08365821838378906, -0.07765960693359375, -0.07166099548339844, -0.06566238403320312, -0.05966377258300781, -0.0536651611328125, -0.04766654968261719, -0.041667938232421875, -0.03566932678222656, -0.02967071533203125, -0.023672103881835938, -0.017673492431640625, -0.011674880981445312, -0.00567626953125, 0.0003223419189453125, 0.006320953369140625, 0.012319564819335938, 0.01831817626953125, 0.024316787719726562, 0.030315399169921875, 0.03631401062011719, 0.0423126220703125, 0.04831123352050781, 0.054309844970703125, 0.06030845642089844, 0.06630706787109375, 0.07230567932128906, 0.07830429077148438, 0.08430290222167969, 0.090301513671875, 0.09630012512207031, 0.10229873657226562, 0.10829734802246094, 0.11429595947265625, 0.12029457092285156, 0.12629318237304688, 0.1322917938232422, 0.1382904052734375, 0.1442890167236328, 0.15028762817382812, 0.15628623962402344, 0.16228485107421875, 0.16828346252441406, 0.17428207397460938, 0.1802806854248047, 0.186279296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 14.0, 10.0, 10.0, 21.0, 28.0, 29.0, 34.0, 55.0, 63.0, 77.0, 76.0, 97.0, 110.0, 93.0, 75.0, 55.0, 36.0, 22.0, 23.0, 19.0, 12.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19873046875, -0.19358444213867188, -0.18843841552734375, -0.18329238891601562, -0.1781463623046875, -0.17300033569335938, -0.16785430908203125, -0.16270828247070312, -0.157562255859375, -0.15241622924804688, -0.14727020263671875, -0.14212417602539062, -0.1369781494140625, -0.13183212280273438, -0.12668609619140625, -0.12154006958007812, -0.11639404296875, -0.11124801635742188, -0.10610198974609375, -0.10095596313476562, -0.0958099365234375, -0.09066390991210938, -0.08551788330078125, -0.08037185668945312, -0.075225830078125, -0.07007980346679688, -0.06493377685546875, -0.059787750244140625, -0.0546417236328125, -0.049495697021484375, -0.04434967041015625, -0.039203643798828125, -0.0340576171875, -0.028911590576171875, -0.02376556396484375, -0.018619537353515625, -0.0134735107421875, -0.008327484130859375, -0.00318145751953125, 0.001964569091796875, 0.007110595703125, 0.012256622314453125, 0.01740264892578125, 0.022548675537109375, 0.0276947021484375, 0.032840728759765625, 0.03798675537109375, 0.043132781982421875, 0.04827880859375, 0.053424835205078125, 0.05857086181640625, 0.06371688842773438, 0.0688629150390625, 0.07400894165039062, 0.07915496826171875, 0.08430099487304688, 0.089447021484375, 0.09459304809570312, 0.09973907470703125, 0.10488510131835938, 0.1100311279296875, 0.11517715454101562, 0.12032318115234375, 0.12546920776367188, 0.130615234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 12.0, 11.0, 22.0, 41.0, 84.0, 185.0, 276.0, 200.0, 83.0, 44.0, 19.0, 12.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.305366039276123, -3.1898200511932373, -3.0742740631103516, -2.9587278366088867, -2.843181848526001, -2.7276358604431152, -2.6120896339416504, -2.4965436458587646, -2.380997657775879, -2.265451669692993, -2.1499056816101074, -2.0343594551086426, -1.9188134670257568, -1.803267478942871, -1.6877213716506958, -1.5721752643585205, -1.4566292762756348, -1.341083288192749, -1.2255371809005737, -1.1099910736083984, -0.9944450855255127, -0.8788990378379822, -0.7633529901504517, -0.6478069424629211, -0.5322608947753906, -0.4167148470878601, -0.3011687994003296, -0.18562275171279907, -0.07007670402526855, 0.04546934366226196, 0.16101539134979248, 0.276561439037323, 0.3921074867248535, 0.507653534412384, 0.6231995820999146, 0.7387456297874451, 0.8542916774749756, 0.9698377251625061, 1.0853837728500366, 1.200929880142212, 1.3164758682250977, 1.4320218563079834, 1.5475679636001587, 1.663114070892334, 1.7786600589752197, 1.8942060470581055, 2.0097522735595703, 2.125298261642456, 2.240844249725342, 2.3563902378082275, 2.4719362258911133, 2.587482452392578, 2.703028440475464, 2.8185744285583496, 2.9341206550598145, 3.0496666431427, 3.165212631225586, 3.2807586193084717, 3.3963046073913574, 3.5118508338928223, 3.627396821975708, 3.7429428100585938, 3.8584890365600586, 3.9740350246429443, 4.08958101272583]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 7.0, 12.0, 16.0, 14.0, 25.0, 30.0, 30.0, 39.0, 47.0, 54.0, 60.0, 56.0, 43.0, 55.0, 58.0, 57.0, 55.0, 44.0, 50.0, 45.0, 27.0, 22.0, 26.0, 28.0, 12.0, 26.0, 14.0, 8.0, 6.0, 9.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.258880853652954, -3.158141613006592, -3.0574026107788086, -2.9566633701324463, -2.855924129486084, -2.7551848888397217, -2.6544456481933594, -2.553706645965576, -2.452967405319214, -2.3522281646728516, -2.2514891624450684, -2.150749921798706, -2.0500106811523438, -1.9492714405059814, -1.8485323190689087, -1.747793197631836, -1.6470539569854736, -1.5463147163391113, -1.4455755949020386, -1.3448364734649658, -1.2440972328186035, -1.1433579921722412, -1.0426188707351685, -0.9418796896934509, -0.8411405086517334, -0.7404013276100159, -0.6396621465682983, -0.5389229655265808, -0.4381837844848633, -0.33744460344314575, -0.23670542240142822, -0.1359662413597107, -0.035227298736572266, 0.06551188230514526, 0.1662510633468628, 0.2669902443885803, 0.36772942543029785, 0.4684686064720154, 0.5692077875137329, 0.6699469685554504, 0.770686149597168, 0.8714253306388855, 0.972164511680603, 1.0729036331176758, 1.173642873764038, 1.2743821144104004, 1.3751212358474731, 1.475860357284546, 1.5765995979309082, 1.6773388385772705, 1.7780779600143433, 1.878817081451416, 1.9795563220977783, 2.0802955627441406, 2.181034564971924, 2.281773805618286, 2.3825130462646484, 2.4832522869110107, 2.583991527557373, 2.6847305297851562, 2.7854697704315186, 2.886209011077881, 2.986948013305664, 3.0876872539520264, 3.1884264945983887]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 11.0, 14.0, 14.0, 26.0, 33.0, 66.0, 107.0, 222.0, 480.0, 1019.0, 3211.0, 21715.0, 3811132.0, 341215.0, 11001.0, 2279.0, 899.0, 368.0, 160.0, 116.0, 58.0, 42.0, 29.0, 12.0, 9.0, 7.0, 8.0, 9.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.40234375, -1.36322021484375, -1.3240966796875, -1.28497314453125, -1.245849609375, -1.20672607421875, -1.1676025390625, -1.12847900390625, -1.08935546875, -1.05023193359375, -1.0111083984375, -0.97198486328125, -0.932861328125, -0.89373779296875, -0.8546142578125, -0.81549072265625, -0.7763671875, -0.73724365234375, -0.6981201171875, -0.65899658203125, -0.619873046875, -0.58074951171875, -0.5416259765625, -0.50250244140625, -0.46337890625, -0.42425537109375, -0.3851318359375, -0.34600830078125, -0.306884765625, -0.26776123046875, -0.2286376953125, -0.18951416015625, -0.150390625, -0.11126708984375, -0.0721435546875, -0.03302001953125, 0.006103515625, 0.04522705078125, 0.0843505859375, 0.12347412109375, 0.16259765625, 0.20172119140625, 0.2408447265625, 0.27996826171875, 0.319091796875, 0.35821533203125, 0.3973388671875, 0.43646240234375, 0.4755859375, 0.51470947265625, 0.5538330078125, 0.59295654296875, 0.632080078125, 0.67120361328125, 0.7103271484375, 0.74945068359375, 0.78857421875, 0.82769775390625, 0.8668212890625, 0.90594482421875, 0.945068359375, 0.98419189453125, 1.0233154296875, 1.06243896484375, 1.1015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 8.0, 17.0, 28.0, 47.0, 65.0, 109.0, 101.0, 154.0, 127.0, 113.0, 76.0, 62.0, 41.0, 18.0, 12.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.188720703125, -0.18314170837402344, -0.17756271362304688, -0.1719837188720703, -0.16640472412109375, -0.1608257293701172, -0.15524673461914062, -0.14966773986816406, -0.1440887451171875, -0.13850975036621094, -0.13293075561523438, -0.1273517608642578, -0.12177276611328125, -0.11619377136230469, -0.11061477661132812, -0.10503578186035156, -0.099456787109375, -0.09387779235839844, -0.08829879760742188, -0.08271980285644531, -0.07714080810546875, -0.07156181335449219, -0.06598281860351562, -0.06040382385253906, -0.0548248291015625, -0.04924583435058594, -0.043666839599609375, -0.03808784484863281, -0.03250885009765625, -0.026929855346679688, -0.021350860595703125, -0.015771865844726562, -0.01019287109375, -0.0046138763427734375, 0.000965118408203125, 0.0065441131591796875, 0.01212310791015625, 0.017702102661132812, 0.023281097412109375, 0.028860092163085938, 0.0344390869140625, 0.04001808166503906, 0.045597076416015625, 0.05117607116699219, 0.05675506591796875, 0.06233406066894531, 0.06791305541992188, 0.07349205017089844, 0.079071044921875, 0.08465003967285156, 0.09022903442382812, 0.09580802917480469, 0.10138702392578125, 0.10696601867675781, 0.11254501342773438, 0.11812400817871094, 0.1237030029296875, 0.12928199768066406, 0.13486099243164062, 0.1404399871826172, 0.14601898193359375, 0.1515979766845703, 0.15717697143554688, 0.16275596618652344, 0.1683349609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 14.0, 14.0, 12.0, 17.0, 34.0, 43.0, 69.0, 91.0, 136.0, 170.0, 237.0, 369.0, 589.0, 1139.0, 2978.0, 11275.0, 72019.0, 3144496.0, 905804.0, 41560.0, 8189.0, 2557.0, 1084.0, 542.0, 302.0, 162.0, 126.0, 81.0, 53.0, 36.0, 22.0, 18.0, 9.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5231285095214844, -0.5076828002929688, -0.4922370910644531, -0.4767913818359375, -0.4613456726074219, -0.44589996337890625, -0.4304542541503906, -0.415008544921875, -0.3995628356933594, -0.38411712646484375, -0.3686714172363281, -0.3532257080078125, -0.3377799987792969, -0.32233428955078125, -0.3068885803222656, -0.29144287109375, -0.2759971618652344, -0.26055145263671875, -0.24510574340820312, -0.2296600341796875, -0.21421432495117188, -0.19876861572265625, -0.18332290649414062, -0.167877197265625, -0.15243148803710938, -0.13698577880859375, -0.12154006958007812, -0.1060943603515625, -0.09064865112304688, -0.07520294189453125, -0.059757232666015625, -0.0443115234375, -0.028865814208984375, -0.01342010498046875, 0.002025604248046875, 0.0174713134765625, 0.032917022705078125, 0.04836273193359375, 0.06380844116210938, 0.079254150390625, 0.09469985961914062, 0.11014556884765625, 0.12559127807617188, 0.1410369873046875, 0.15648269653320312, 0.17192840576171875, 0.18737411499023438, 0.20281982421875, 0.21826553344726562, 0.23371124267578125, 0.24915695190429688, 0.2646026611328125, 0.2800483703613281, 0.29549407958984375, 0.3109397888183594, 0.326385498046875, 0.3418312072753906, 0.35727691650390625, 0.3727226257324219, 0.3881683349609375, 0.4036140441894531, 0.41905975341796875, 0.4345054626464844, 0.449951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 16.0, 21.0, 29.0, 48.0, 116.0, 303.0, 1155.0, 1700.0, 363.0, 157.0, 69.0, 41.0, 13.0, 14.0, 12.0, 6.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.2552661895751953, -0.24856948852539062, -0.24187278747558594, -0.23517608642578125, -0.22847938537597656, -0.22178268432617188, -0.2150859832763672, -0.2083892822265625, -0.2016925811767578, -0.19499588012695312, -0.18829917907714844, -0.18160247802734375, -0.17490577697753906, -0.16820907592773438, -0.1615123748779297, -0.154815673828125, -0.1481189727783203, -0.14142227172851562, -0.13472557067871094, -0.12802886962890625, -0.12133216857910156, -0.11463546752929688, -0.10793876647949219, -0.1012420654296875, -0.09454536437988281, -0.08784866333007812, -0.08115196228027344, -0.07445526123046875, -0.06775856018066406, -0.061061859130859375, -0.05436515808105469, -0.04766845703125, -0.04097175598144531, -0.034275054931640625, -0.027578353881835938, -0.02088165283203125, -0.014184951782226562, -0.007488250732421875, -0.0007915496826171875, 0.0059051513671875, 0.012601852416992188, 0.019298553466796875, 0.025995254516601562, 0.03269195556640625, 0.03938865661621094, 0.046085357666015625, 0.05278205871582031, 0.059478759765625, 0.06617546081542969, 0.07287216186523438, 0.07956886291503906, 0.08626556396484375, 0.09296226501464844, 0.09965896606445312, 0.10635566711425781, 0.1130523681640625, 0.11974906921386719, 0.12644577026367188, 0.13314247131347656, 0.13983917236328125, 0.14653587341308594, 0.15323257446289062, 0.1599292755126953, 0.1666259765625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 21.0, 79.0, 247.0, 395.0, 177.0, 56.0, 14.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2514867782592773, -1.2057465314865112, -1.1600062847137451, -1.114266037940979, -1.068525791168213, -1.0227855443954468, -0.9770452976226807, -0.9313050508499146, -0.8855648040771484, -0.8398245573043823, -0.7940843105316162, -0.7483440637588501, -0.702603816986084, -0.6568635702133179, -0.6111233234405518, -0.5653830766677856, -0.5196428894996643, -0.4739026427268982, -0.4281623959541321, -0.38242214918136597, -0.33668190240859985, -0.29094165563583374, -0.24520143866539001, -0.1994611918926239, -0.1537209451198578, -0.10798069834709167, -0.06224045902490616, -0.016500219702720642, 0.02924002707004547, 0.07498027384281158, 0.1207205057144165, 0.16646075248718262, 0.21220099925994873, 0.25794124603271484, 0.30368149280548096, 0.34942173957824707, 0.3951619863510132, 0.4409022331237793, 0.486642450094223, 0.5323827266693115, 0.5781229734420776, 0.6238632202148438, 0.6696034669876099, 0.715343713760376, 0.7610839605331421, 0.8068242073059082, 0.8525644540786743, 0.8983047008514404, 0.9440448880195618, 0.9897851347923279, 1.0355253219604492, 1.0812655687332153, 1.1270058155059814, 1.1727460622787476, 1.2184863090515137, 1.2642265558242798, 1.309966802597046, 1.355707049369812, 1.4014472961425781, 1.4471875429153442, 1.4929277896881104, 1.5386680364608765, 1.5844082832336426, 1.6301485300064087, 1.6758887767791748]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 0.0, 4.0, 8.0, 11.0, 16.0, 16.0, 12.0, 30.0, 23.0, 27.0, 38.0, 47.0, 58.0, 41.0, 50.0, 54.0, 64.0, 55.0, 46.0, 62.0, 42.0, 43.0, 54.0, 35.0, 30.0, 40.0, 20.0, 19.0, 15.0, 8.0, 11.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5758954286575317, -0.5598230361938477, -0.5437506437301636, -0.5276781916618347, -0.5116057991981506, -0.49553340673446655, -0.47946101427078247, -0.463388592004776, -0.44731616973876953, -0.43124377727508545, -0.415171355009079, -0.3990989625453949, -0.3830265402793884, -0.36695414781570435, -0.35088175535202026, -0.3348093330860138, -0.3187369406223297, -0.30266454815864563, -0.28659212589263916, -0.2705197334289551, -0.2544473111629486, -0.23837491869926453, -0.22230251133441925, -0.20623010396957397, -0.1901576966047287, -0.17408528923988342, -0.15801288187503815, -0.14194047451019287, -0.1258680820465088, -0.10979566723108292, -0.09372326731681824, -0.07765085995197296, -0.061578452587127686, -0.04550604522228241, -0.029433641582727432, -0.013361237943172455, 0.002711169421672821, 0.018783576786518097, 0.034855976700782776, 0.05092838406562805, 0.06700079143047333, 0.0830731987953186, 0.09914560616016388, 0.11521800607442856, 0.13129040598869324, 0.1473628282546997, 0.1634352207183838, 0.17950762808322906, 0.19558003544807434, 0.21165244281291962, 0.2277248501777649, 0.24379724264144897, 0.25986966490745544, 0.2759420573711395, 0.292014479637146, 0.3080868721008301, 0.32415926456451416, 0.34023165702819824, 0.3563040792942047, 0.3723764717578888, 0.38844889402389526, 0.40452128648757935, 0.4205936789512634, 0.4366661012172699, 0.45273852348327637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 6.0, 13.0, 20.0, 19.0, 20.0, 28.0, 51.0, 67.0, 95.0, 114.0, 153.0, 193.0, 322.0, 489.0, 793.0, 1481.0, 3037.0, 7577.0, 23799.0, 98823.0, 461130.0, 350606.0, 69722.0, 17996.0, 6124.0, 2516.0, 1207.0, 714.0, 418.0, 252.0, 189.0, 169.0, 90.0, 75.0, 52.0, 49.0, 36.0, 17.0, 24.0, 15.0, 11.0, 7.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.35791015625, -0.3470268249511719, -0.33614349365234375, -0.3252601623535156, -0.3143768310546875, -0.3034934997558594, -0.29261016845703125, -0.2817268371582031, -0.270843505859375, -0.2599601745605469, -0.24907684326171875, -0.23819351196289062, -0.2273101806640625, -0.21642684936523438, -0.20554351806640625, -0.19466018676757812, -0.18377685546875, -0.17289352416992188, -0.16201019287109375, -0.15112686157226562, -0.1402435302734375, -0.12936019897460938, -0.11847686767578125, -0.10759353637695312, -0.096710205078125, -0.08582687377929688, -0.07494354248046875, -0.06406021118164062, -0.0531768798828125, -0.042293548583984375, -0.03141021728515625, -0.020526885986328125, -0.0096435546875, 0.001239776611328125, 0.01212310791015625, 0.023006439208984375, 0.0338897705078125, 0.044773101806640625, 0.05565643310546875, 0.06653976440429688, 0.077423095703125, 0.08830642700195312, 0.09918975830078125, 0.11007308959960938, 0.1209564208984375, 0.13183975219726562, 0.14272308349609375, 0.15360641479492188, 0.16448974609375, 0.17537307739257812, 0.18625640869140625, 0.19713973999023438, 0.2080230712890625, 0.21890640258789062, 0.22978973388671875, 0.24067306518554688, 0.251556396484375, 0.2624397277832031, 0.27332305908203125, 0.2842063903808594, 0.2950897216796875, 0.3059730529785156, 0.31685638427734375, 0.3277397155761719, 0.338623046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 20.0, 46.0, 50.0, 83.0, 100.0, 124.0, 147.0, 142.0, 84.0, 74.0, 42.0, 34.0, 17.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1677532196044922, -0.16241073608398438, -0.15706825256347656, -0.15172576904296875, -0.14638328552246094, -0.14104080200195312, -0.1356983184814453, -0.1303558349609375, -0.1250133514404297, -0.11967086791992188, -0.11432838439941406, -0.10898590087890625, -0.10364341735839844, -0.09830093383789062, -0.09295845031738281, -0.087615966796875, -0.08227348327636719, -0.07693099975585938, -0.07158851623535156, -0.06624603271484375, -0.06090354919433594, -0.055561065673828125, -0.05021858215332031, -0.0448760986328125, -0.03953361511230469, -0.034191131591796875, -0.028848648071289062, -0.02350616455078125, -0.018163681030273438, -0.012821197509765625, -0.0074787139892578125, -0.00213623046875, 0.0032062530517578125, 0.008548736572265625, 0.013891220092773438, 0.01923370361328125, 0.024576187133789062, 0.029918670654296875, 0.03526115417480469, 0.0406036376953125, 0.04594612121582031, 0.051288604736328125, 0.05663108825683594, 0.06197357177734375, 0.06731605529785156, 0.07265853881835938, 0.07800102233886719, 0.083343505859375, 0.08868598937988281, 0.09402847290039062, 0.09937095642089844, 0.10471343994140625, 0.11005592346191406, 0.11539840698242188, 0.12074089050292969, 0.1260833740234375, 0.1314258575439453, 0.13676834106445312, 0.14211082458496094, 0.14745330810546875, 0.15279579162597656, 0.15813827514648438, 0.1634807586669922, 0.1688232421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 11.0, 4.0, 6.0, 11.0, 12.0, 25.0, 21.0, 22.0, 43.0, 69.0, 77.0, 116.0, 168.0, 301.0, 467.0, 765.0, 1539.0, 3051.0, 6495.0, 15869.0, 44665.0, 154091.0, 424163.0, 275506.0, 76902.0, 25078.0, 9844.0, 4358.0, 2068.0, 1113.0, 615.0, 338.0, 210.0, 152.0, 104.0, 68.0, 52.0, 39.0, 34.0, 22.0, 14.0, 12.0, 11.0, 8.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2890625, -0.2799530029296875, -0.270843505859375, -0.2617340087890625, -0.25262451171875, -0.2435150146484375, -0.234405517578125, -0.2252960205078125, -0.2161865234375, -0.2070770263671875, -0.197967529296875, -0.1888580322265625, -0.17974853515625, -0.1706390380859375, -0.161529541015625, -0.1524200439453125, -0.143310546875, -0.1342010498046875, -0.125091552734375, -0.1159820556640625, -0.10687255859375, -0.0977630615234375, -0.088653564453125, -0.0795440673828125, -0.0704345703125, -0.0613250732421875, -0.052215576171875, -0.0431060791015625, -0.03399658203125, -0.0248870849609375, -0.015777587890625, -0.0066680908203125, 0.00244140625, 0.0115509033203125, 0.020660400390625, 0.0297698974609375, 0.03887939453125, 0.0479888916015625, 0.057098388671875, 0.0662078857421875, 0.0753173828125, 0.0844268798828125, 0.093536376953125, 0.1026458740234375, 0.11175537109375, 0.1208648681640625, 0.129974365234375, 0.1390838623046875, 0.148193359375, 0.1573028564453125, 0.166412353515625, 0.1755218505859375, 0.18463134765625, 0.1937408447265625, 0.202850341796875, 0.2119598388671875, 0.2210693359375, 0.2301788330078125, 0.239288330078125, 0.2483978271484375, 0.25750732421875, 0.2666168212890625, 0.275726318359375, 0.2848358154296875, 0.2939453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 5.0, 5.0, 5.0, 4.0, 8.0, 17.0, 16.0, 16.0, 18.0, 25.0, 18.0, 34.0, 43.0, 36.0, 58.0, 35.0, 45.0, 36.0, 38.0, 50.0, 49.0, 38.0, 42.0, 46.0, 44.0, 29.0, 34.0, 37.0, 18.0, 24.0, 25.0, 13.0, 9.0, 8.0, 11.0, 12.0, 14.0, 5.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.40283203125, -0.3906669616699219, -0.37850189208984375, -0.3663368225097656, -0.3541717529296875, -0.3420066833496094, -0.32984161376953125, -0.3176765441894531, -0.305511474609375, -0.2933464050292969, -0.28118133544921875, -0.2690162658691406, -0.2568511962890625, -0.24468612670898438, -0.23252105712890625, -0.22035598754882812, -0.20819091796875, -0.19602584838867188, -0.18386077880859375, -0.17169570922851562, -0.1595306396484375, -0.14736557006835938, -0.13520050048828125, -0.12303543090820312, -0.110870361328125, -0.09870529174804688, -0.08654022216796875, -0.07437515258789062, -0.0622100830078125, -0.050045013427734375, -0.03787994384765625, -0.025714874267578125, -0.0135498046875, -0.001384735107421875, 0.01078033447265625, 0.022945404052734375, 0.0351104736328125, 0.047275543212890625, 0.05944061279296875, 0.07160568237304688, 0.083770751953125, 0.09593582153320312, 0.10810089111328125, 0.12026596069335938, 0.1324310302734375, 0.14459609985351562, 0.15676116943359375, 0.16892623901367188, 0.18109130859375, 0.19325637817382812, 0.20542144775390625, 0.21758651733398438, 0.2297515869140625, 0.24191665649414062, 0.25408172607421875, 0.2662467956542969, 0.278411865234375, 0.2905769348144531, 0.30274200439453125, 0.3149070739746094, 0.3270721435546875, 0.3392372131347656, 0.35140228271484375, 0.3635673522949219, 0.375732421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 11.0, 8.0, 11.0, 11.0, 8.0, 35.0, 38.0, 64.0, 83.0, 167.0, 289.0, 532.0, 1110.0, 2822.0, 8695.0, 33783.0, 158749.0, 534955.0, 238954.0, 49260.0, 12356.0, 3721.0, 1464.0, 599.0, 327.0, 185.0, 113.0, 52.0, 42.0, 28.0, 16.0, 14.0, 7.0, 8.0, 6.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.11907958984375, -0.1158285140991211, -0.11257743835449219, -0.10932636260986328, -0.10607528686523438, -0.10282421112060547, -0.09957313537597656, -0.09632205963134766, -0.09307098388671875, -0.08981990814208984, -0.08656883239746094, -0.08331775665283203, -0.08006668090820312, -0.07681560516357422, -0.07356452941894531, -0.0703134536743164, -0.0670623779296875, -0.0638113021850586, -0.06056022644042969, -0.05730915069580078, -0.054058074951171875, -0.05080699920654297, -0.04755592346191406, -0.044304847717285156, -0.04105377197265625, -0.037802696228027344, -0.03455162048339844, -0.03130054473876953, -0.028049468994140625, -0.02479839324951172, -0.021547317504882812, -0.018296241760253906, -0.015045166015625, -0.011794090270996094, -0.008543014526367188, -0.005291938781738281, -0.002040863037109375, 0.0012102127075195312, 0.0044612884521484375, 0.007712364196777344, 0.01096343994140625, 0.014214515686035156, 0.017465591430664062, 0.02071666717529297, 0.023967742919921875, 0.02721881866455078, 0.030469894409179688, 0.033720970153808594, 0.0369720458984375, 0.040223121643066406, 0.04347419738769531, 0.04672527313232422, 0.049976348876953125, 0.05322742462158203, 0.05647850036621094, 0.059729576110839844, 0.06298065185546875, 0.06623172760009766, 0.06948280334472656, 0.07273387908935547, 0.07598495483398438, 0.07923603057861328, 0.08248710632324219, 0.0857381820678711, 0.0889892578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 12.0, 11.0, 21.0, 26.0, 35.0, 37.0, 52.0, 96.0, 134.0, 142.0, 126.0, 88.0, 59.0, 45.0, 33.0, 24.0, 18.0, 11.0, 11.0, 6.0, 0.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020694732666015625, -0.00020219851285219193, -0.0001974496990442276, -0.00019270088523626328, -0.00018795207142829895, -0.00018320325762033463, -0.0001784544438123703, -0.00017370563000440598, -0.00016895681619644165, -0.00016420800238847733, -0.000159459188580513, -0.00015471037477254868, -0.00014996156096458435, -0.00014521274715662003, -0.0001404639333486557, -0.00013571511954069138, -0.00013096630573272705, -0.00012621749192476273, -0.0001214686781167984, -0.00011671986430883408, -0.00011197105050086975, -0.00010722223669290543, -0.0001024734228849411, -9.772460907697678e-05, -9.297579526901245e-05, -8.822698146104813e-05, -8.34781676530838e-05, -7.872935384511948e-05, -7.398054003715515e-05, -6.923172622919083e-05, -6.44829124212265e-05, -5.9734098613262177e-05, -5.498528480529785e-05, -5.0236470997333527e-05, -4.54876571893692e-05, -4.073884338140488e-05, -3.599002957344055e-05, -3.124121576547623e-05, -2.6492401957511902e-05, -2.1743588149547577e-05, -1.6994774341583252e-05, -1.2245960533618927e-05, -7.497146725654602e-06, -2.748332917690277e-06, 2.000480890274048e-06, 6.749294698238373e-06, 1.1498108506202698e-05, 1.6246922314167023e-05, 2.0995736122131348e-05, 2.5744549930095673e-05, 3.0493363738059998e-05, 3.524217754602432e-05, 3.999099135398865e-05, 4.473980516195297e-05, 4.94886189699173e-05, 5.423743277788162e-05, 5.898624658584595e-05, 6.373506039381027e-05, 6.84838742017746e-05, 7.323268800973892e-05, 7.798150181770325e-05, 8.273031562566757e-05, 8.74791294336319e-05, 9.222794324159622e-05, 9.697675704956055e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 13.0, 14.0, 23.0, 46.0, 51.0, 92.0, 148.0, 213.0, 414.0, 769.0, 1629.0, 4070.0, 12952.0, 53072.0, 251757.0, 530099.0, 146607.0, 32512.0, 8529.0, 2849.0, 1258.0, 591.0, 325.0, 166.0, 122.0, 57.0, 41.0, 31.0, 17.0, 21.0, 17.0, 10.0, 7.0, 6.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11688232421875, -0.11347770690917969, -0.11007308959960938, -0.10666847229003906, -0.10326385498046875, -0.09985923767089844, -0.09645462036132812, -0.09305000305175781, -0.0896453857421875, -0.08624076843261719, -0.08283615112304688, -0.07943153381347656, -0.07602691650390625, -0.07262229919433594, -0.06921768188476562, -0.06581306457519531, -0.062408447265625, -0.05900382995605469, -0.055599212646484375, -0.05219459533691406, -0.04878997802734375, -0.04538536071777344, -0.041980743408203125, -0.03857612609863281, -0.0351715087890625, -0.03176689147949219, -0.028362274169921875, -0.024957656860351562, -0.02155303955078125, -0.018148422241210938, -0.014743804931640625, -0.011339187622070312, -0.0079345703125, -0.0045299530029296875, -0.001125335693359375, 0.0022792816162109375, 0.00568389892578125, 0.009088516235351562, 0.012493133544921875, 0.015897750854492188, 0.0193023681640625, 0.022706985473632812, 0.026111602783203125, 0.029516220092773438, 0.03292083740234375, 0.03632545471191406, 0.039730072021484375, 0.04313468933105469, 0.046539306640625, 0.04994392395019531, 0.053348541259765625, 0.05675315856933594, 0.06015777587890625, 0.06356239318847656, 0.06696701049804688, 0.07037162780761719, 0.0737762451171875, 0.07718086242675781, 0.08058547973632812, 0.08399009704589844, 0.08739471435546875, 0.09079933166503906, 0.09420394897460938, 0.09760856628417969, 0.10101318359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 17.0, 18.0, 28.0, 41.0, 67.0, 85.0, 105.0, 106.0, 110.0, 108.0, 97.0, 55.0, 53.0, 33.0, 30.0, 13.0, 9.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14612293243408203, -0.14197731018066406, -0.1378316879272461, -0.13368606567382812, -0.12954044342041016, -0.1253948211669922, -0.12124919891357422, -0.11710357666015625, -0.11295795440673828, -0.10881233215332031, -0.10466670989990234, -0.10052108764648438, -0.0963754653930664, -0.09222984313964844, -0.08808422088623047, -0.0839385986328125, -0.07979297637939453, -0.07564735412597656, -0.0715017318725586, -0.06735610961914062, -0.06321048736572266, -0.05906486511230469, -0.05491924285888672, -0.05077362060546875, -0.04662799835205078, -0.04248237609863281, -0.038336753845214844, -0.034191131591796875, -0.030045509338378906, -0.025899887084960938, -0.02175426483154297, -0.017608642578125, -0.013463020324707031, -0.009317398071289062, -0.005171775817871094, -0.001026153564453125, 0.0031194686889648438, 0.0072650909423828125, 0.011410713195800781, 0.01555633544921875, 0.01970195770263672, 0.023847579956054688, 0.027993202209472656, 0.032138824462890625, 0.036284446716308594, 0.04043006896972656, 0.04457569122314453, 0.0487213134765625, 0.05286693572998047, 0.05701255798339844, 0.061158180236816406, 0.06530380249023438, 0.06944942474365234, 0.07359504699707031, 0.07774066925048828, 0.08188629150390625, 0.08603191375732422, 0.09017753601074219, 0.09432315826416016, 0.09846878051757812, 0.1026144027709961, 0.10676002502441406, 0.11090564727783203, 0.11505126953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 19.0, 9.0, 13.0, 39.0, 54.0, 122.0, 204.0, 226.0, 118.0, 79.0, 37.0, 23.0, 21.0, 16.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.877943515777588, -1.7968614101409912, -1.715779423713684, -1.6346973180770874, -1.5536153316497803, -1.4725332260131836, -1.391451120376587, -1.3103690147399902, -1.229287028312683, -1.1482049226760864, -1.0671229362487793, -0.9860408306121826, -0.9049587845802307, -0.8238767385482788, -0.7427946329116821, -0.6617125868797302, -0.5806305408477783, -0.4995484948158264, -0.4184664189815521, -0.33738434314727783, -0.2563022971153259, -0.17522025108337402, -0.09413817524909973, -0.01305609941482544, 0.06802594661712646, 0.14910800755023956, 0.23019006848335266, 0.31127214431762695, 0.39235419034957886, 0.47343623638153076, 0.5545183420181274, 0.6356003880500793, 0.7166826725006104, 0.7977647185325623, 0.8788467645645142, 0.9599288702011108, 1.041010856628418, 1.1220929622650146, 1.2031750679016113, 1.284257173538208, 1.3653391599655151, 1.4464212656021118, 1.527503252029419, 1.6085853576660156, 1.6896674633026123, 1.7707494497299194, 1.8518315553665161, 1.9329135417938232, 2.01399564743042, 2.0950777530670166, 2.1761598587036133, 2.257241725921631, 2.3383238315582275, 2.419405937194824, 2.500488042831421, 2.5815701484680176, 2.662652015686035, 2.743734121322632, 2.8248162269592285, 2.905898094177246, 2.9869801998138428, 3.0680623054504395, 3.149144411087036, 3.230226516723633, 3.3113086223602295]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 9.0, 12.0, 10.0, 9.0, 16.0, 25.0, 21.0, 33.0, 26.0, 32.0, 36.0, 40.0, 47.0, 35.0, 43.0, 50.0, 41.0, 47.0, 47.0, 51.0, 42.0, 38.0, 36.0, 28.0, 27.0, 30.0, 20.0, 16.0, 17.0, 9.0, 12.0, 10.0, 7.0, 9.0, 8.0, 6.0, 8.0, 2.0, 3.0, 2.0, 1.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.3410449028015137, -2.270845651626587, -2.20064640045166, -2.1304471492767334, -2.0602478981018066, -1.9900486469268799, -1.9198493957519531, -1.8496501445770264, -1.7794508934020996, -1.7092516422271729, -1.639052391052246, -1.5688531398773193, -1.4986538887023926, -1.4284546375274658, -1.358255386352539, -1.2880561351776123, -1.2178568840026855, -1.1476576328277588, -1.077458381652832, -1.0072591304779053, -0.9370598793029785, -0.8668606281280518, -0.796661376953125, -0.7264621257781982, -0.6562628746032715, -0.5860636234283447, -0.515864372253418, -0.4456651210784912, -0.37546586990356445, -0.3052666187286377, -0.23506736755371094, -0.16486811637878418, -0.09466910362243652, -0.024469852447509766, 0.04572939872741699, 0.11592864990234375, 0.1861279010772705, 0.25632715225219727, 0.326526403427124, 0.3967256546020508, 0.46692490577697754, 0.5371241569519043, 0.607323408126831, 0.6775226593017578, 0.7477219104766846, 0.8179211616516113, 0.8881204128265381, 0.9583196640014648, 1.0285189151763916, 1.0987181663513184, 1.1689174175262451, 1.2391166687011719, 1.3093159198760986, 1.3795151710510254, 1.4497144222259521, 1.519913673400879, 1.5901129245758057, 1.6603121757507324, 1.7305114269256592, 1.800710678100586, 1.8709099292755127, 1.9411091804504395, 2.011308431625366, 2.081507682800293, 2.1517069339752197]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 11.0, 13.0, 20.0, 19.0, 43.0, 81.0, 131.0, 253.0, 515.0, 1164.0, 3306.0, 11711.0, 103406.0, 3962158.0, 94279.0, 11448.0, 3072.0, 1296.0, 563.0, 276.0, 176.0, 96.0, 60.0, 56.0, 33.0, 23.0, 17.0, 13.0, 10.0, 5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5022354125976562, -0.4839630126953125, -0.46569061279296875, -0.447418212890625, -0.42914581298828125, -0.4108734130859375, -0.39260101318359375, -0.37432861328125, -0.35605621337890625, -0.3377838134765625, -0.31951141357421875, -0.301239013671875, -0.28296661376953125, -0.2646942138671875, -0.24642181396484375, -0.2281494140625, -0.20987701416015625, -0.1916046142578125, -0.17333221435546875, -0.155059814453125, -0.13678741455078125, -0.1185150146484375, -0.10024261474609375, -0.08197021484375, -0.06369781494140625, -0.0454254150390625, -0.02715301513671875, -0.008880615234375, 0.00939178466796875, 0.0276641845703125, 0.04593658447265625, 0.064208984375, 0.08248138427734375, 0.1007537841796875, 0.11902618408203125, 0.137298583984375, 0.15557098388671875, 0.1738433837890625, 0.19211578369140625, 0.21038818359375, 0.22866058349609375, 0.2469329833984375, 0.26520538330078125, 0.283477783203125, 0.30175018310546875, 0.3200225830078125, 0.33829498291015625, 0.3565673828125, 0.37483978271484375, 0.3931121826171875, 0.41138458251953125, 0.429656982421875, 0.44792938232421875, 0.4662017822265625, 0.48447418212890625, 0.50274658203125, 0.5210189819335938, 0.5392913818359375, 0.5575637817382812, 0.575836181640625, 0.5941085815429688, 0.6123809814453125, 0.6306533813476562, 0.64892578125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 15.0, 24.0, 39.0, 40.0, 71.0, 95.0, 99.0, 102.0, 134.0, 98.0, 82.0, 62.0, 39.0, 34.0, 17.0, 13.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1492919921875, -0.14429283142089844, -0.13929367065429688, -0.1342945098876953, -0.12929534912109375, -0.12429618835449219, -0.11929702758789062, -0.11429786682128906, -0.1092987060546875, -0.10429954528808594, -0.09930038452148438, -0.09430122375488281, -0.08930206298828125, -0.08430290222167969, -0.07930374145507812, -0.07430458068847656, -0.069305419921875, -0.06430625915527344, -0.059307098388671875, -0.05430793762207031, -0.04930877685546875, -0.04430961608886719, -0.039310455322265625, -0.03431129455566406, -0.0293121337890625, -0.024312973022460938, -0.019313812255859375, -0.014314651489257812, -0.00931549072265625, -0.0043163299560546875, 0.000682830810546875, 0.0056819915771484375, 0.01068115234375, 0.015680313110351562, 0.020679473876953125, 0.025678634643554688, 0.03067779541015625, 0.03567695617675781, 0.040676116943359375, 0.04567527770996094, 0.0506744384765625, 0.05567359924316406, 0.060672760009765625, 0.06567192077636719, 0.07067108154296875, 0.07567024230957031, 0.08066940307617188, 0.08566856384277344, 0.090667724609375, 0.09566688537597656, 0.10066604614257812, 0.10566520690917969, 0.11066436767578125, 0.11566352844238281, 0.12066268920898438, 0.12566184997558594, 0.1306610107421875, 0.13566017150878906, 0.14065933227539062, 0.1456584930419922, 0.15065765380859375, 0.1556568145751953, 0.16065597534179688, 0.16565513610839844, 0.170654296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 14.0, 10.0, 22.0, 30.0, 42.0, 65.0, 105.0, 166.0, 297.0, 538.0, 969.0, 2116.0, 5619.0, 20177.0, 130557.0, 3324234.0, 641029.0, 49631.0, 11169.0, 3903.0, 1625.0, 809.0, 456.0, 258.0, 164.0, 98.0, 66.0, 42.0, 24.0, 15.0, 11.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28466796875, -0.27597808837890625, -0.2672882080078125, -0.25859832763671875, -0.249908447265625, -0.24121856689453125, -0.2325286865234375, -0.22383880615234375, -0.21514892578125, -0.20645904541015625, -0.1977691650390625, -0.18907928466796875, -0.180389404296875, -0.17169952392578125, -0.1630096435546875, -0.15431976318359375, -0.1456298828125, -0.13694000244140625, -0.1282501220703125, -0.11956024169921875, -0.110870361328125, -0.10218048095703125, -0.0934906005859375, -0.08480072021484375, -0.07611083984375, -0.06742095947265625, -0.0587310791015625, -0.05004119873046875, -0.041351318359375, -0.03266143798828125, -0.0239715576171875, -0.01528167724609375, -0.006591796875, 0.00209808349609375, 0.0107879638671875, 0.01947784423828125, 0.028167724609375, 0.03685760498046875, 0.0455474853515625, 0.05423736572265625, 0.06292724609375, 0.07161712646484375, 0.0803070068359375, 0.08899688720703125, 0.097686767578125, 0.10637664794921875, 0.1150665283203125, 0.12375640869140625, 0.1324462890625, 0.14113616943359375, 0.1498260498046875, 0.15851593017578125, 0.167205810546875, 0.17589569091796875, 0.1845855712890625, 0.19327545166015625, 0.20196533203125, 0.21065521240234375, 0.2193450927734375, 0.22803497314453125, 0.236724853515625, 0.24541473388671875, 0.2541046142578125, 0.26279449462890625, 0.271484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 15.0, 5.0, 15.0, 30.0, 31.0, 74.0, 124.0, 297.0, 848.0, 1569.0, 546.0, 216.0, 108.0, 63.0, 34.0, 24.0, 16.0, 12.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09725093841552734, -0.09403800964355469, -0.09082508087158203, -0.08761215209960938, -0.08439922332763672, -0.08118629455566406, -0.0779733657836914, -0.07476043701171875, -0.0715475082397461, -0.06833457946777344, -0.06512165069580078, -0.061908721923828125, -0.05869579315185547, -0.05548286437988281, -0.052269935607910156, -0.0490570068359375, -0.045844078063964844, -0.04263114929199219, -0.03941822052001953, -0.036205291748046875, -0.03299236297607422, -0.029779434204101562, -0.026566505432128906, -0.02335357666015625, -0.020140647888183594, -0.016927719116210938, -0.013714790344238281, -0.010501861572265625, -0.007288932800292969, -0.0040760040283203125, -0.0008630752563476562, 0.002349853515625, 0.005562782287597656, 0.008775711059570312, 0.011988639831542969, 0.015201568603515625, 0.01841449737548828, 0.021627426147460938, 0.024840354919433594, 0.02805328369140625, 0.031266212463378906, 0.03447914123535156, 0.03769207000732422, 0.040904998779296875, 0.04411792755126953, 0.04733085632324219, 0.050543785095214844, 0.0537567138671875, 0.056969642639160156, 0.06018257141113281, 0.06339550018310547, 0.06660842895507812, 0.06982135772705078, 0.07303428649902344, 0.0762472152709961, 0.07946014404296875, 0.0826730728149414, 0.08588600158691406, 0.08909893035888672, 0.09231185913085938, 0.09552478790283203, 0.09873771667480469, 0.10195064544677734, 0.10516357421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 6.0, 10.0, 30.0, 60.0, 124.0, 212.0, 223.0, 186.0, 76.0, 45.0, 14.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7238551378250122, -0.7037040591239929, -0.6835530400276184, -0.6634019613265991, -0.6432509422302246, -0.6230998635292053, -0.6029488444328308, -0.5827977657318115, -0.562646746635437, -0.5424956679344177, -0.5223446488380432, -0.5021935701370239, -0.4820425510406494, -0.4618914723396301, -0.4417404234409332, -0.42158937454223633, -0.40143829584121704, -0.38128724694252014, -0.36113619804382324, -0.34098514914512634, -0.32083410024642944, -0.30068302154541016, -0.28053197264671326, -0.26038092374801636, -0.24022987484931946, -0.22007882595062256, -0.19992777705192566, -0.17977671325206757, -0.15962566435337067, -0.13947461545467377, -0.11932355910539627, -0.09917250275611877, -0.0790213942527771, -0.0588703416287899, -0.038719289004802704, -0.018568236380815506, 0.001582816243171692, 0.02173386514186859, 0.04188492149114609, 0.062035977840423584, 0.08218702673912048, 0.10233807563781738, 0.12248913198709488, 0.14264018833637238, 0.16279123723506927, 0.18294228613376617, 0.20309334993362427, 0.22324439883232117, 0.24339544773101807, 0.26354649662971497, 0.28369754552841187, 0.30384859442710876, 0.32399964332580566, 0.34415072202682495, 0.36430177092552185, 0.38445281982421875, 0.40460386872291565, 0.42475491762161255, 0.44490596652030945, 0.46505701541900635, 0.48520809412002563, 0.5053591132164001, 0.5255101919174194, 0.545661211013794, 0.5658122897148132]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 9.0, 5.0, 13.0, 13.0, 14.0, 11.0, 20.0, 30.0, 23.0, 34.0, 30.0, 52.0, 52.0, 39.0, 45.0, 43.0, 43.0, 47.0, 46.0, 36.0, 40.0, 45.0, 49.0, 36.0, 35.0, 25.0, 33.0, 25.0, 18.0, 17.0, 13.0, 15.0, 11.0, 9.0, 3.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24737590551376343, -0.23817496001720428, -0.22897401452064514, -0.219773069024086, -0.21057212352752686, -0.2013711780309677, -0.19217023253440857, -0.18296928703784943, -0.17376834154129028, -0.16456739604473114, -0.155366450548172, -0.14616550505161285, -0.1369645595550537, -0.12776361405849457, -0.11856266856193542, -0.10936172306537628, -0.10016077756881714, -0.090959832072258, -0.08175888657569885, -0.07255794107913971, -0.06335699558258057, -0.05415605008602142, -0.04495510458946228, -0.03575415909290314, -0.026553213596343994, -0.01735226809978485, -0.008151322603225708, 0.001049622893333435, 0.010250568389892578, 0.01945151388645172, 0.028652459383010864, 0.03785340487957001, 0.04705435037612915, 0.05625529587268829, 0.06545624136924744, 0.07465718686580658, 0.08385813236236572, 0.09305907785892487, 0.10226002335548401, 0.11146096885204315, 0.1206619143486023, 0.12986285984516144, 0.13906380534172058, 0.14826475083827972, 0.15746569633483887, 0.166666641831398, 0.17586758732795715, 0.1850685328245163, 0.19426947832107544, 0.20347042381763458, 0.21267136931419373, 0.22187231481075287, 0.231073260307312, 0.24027420580387115, 0.2494751513004303, 0.25867611169815063, 0.2678770422935486, 0.27707797288894653, 0.28627893328666687, 0.2954798936843872, 0.30468082427978516, 0.3138817548751831, 0.32308271527290344, 0.3322836756706238, 0.34148460626602173]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 15.0, 14.0, 33.0, 30.0, 55.0, 62.0, 126.0, 160.0, 278.0, 466.0, 761.0, 1500.0, 3517.0, 9578.0, 33778.0, 177569.0, 593018.0, 176965.0, 34001.0, 9641.0, 3396.0, 1550.0, 765.0, 464.0, 233.0, 183.0, 113.0, 70.0, 58.0, 34.0, 32.0, 19.0, 12.0, 14.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3623046875, -0.35042572021484375, -0.3385467529296875, -0.32666778564453125, -0.314788818359375, -0.30290985107421875, -0.2910308837890625, -0.27915191650390625, -0.26727294921875, -0.25539398193359375, -0.2435150146484375, -0.23163604736328125, -0.219757080078125, -0.20787811279296875, -0.1959991455078125, -0.18412017822265625, -0.1722412109375, -0.16036224365234375, -0.1484832763671875, -0.13660430908203125, -0.124725341796875, -0.11284637451171875, -0.1009674072265625, -0.08908843994140625, -0.07720947265625, -0.06533050537109375, -0.0534515380859375, -0.04157257080078125, -0.029693603515625, -0.01781463623046875, -0.0059356689453125, 0.00594329833984375, 0.017822265625, 0.02970123291015625, 0.0415802001953125, 0.05345916748046875, 0.065338134765625, 0.07721710205078125, 0.0890960693359375, 0.10097503662109375, 0.11285400390625, 0.12473297119140625, 0.1366119384765625, 0.14849090576171875, 0.160369873046875, 0.17224884033203125, 0.1841278076171875, 0.19600677490234375, 0.2078857421875, 0.21976470947265625, 0.2316436767578125, 0.24352264404296875, 0.255401611328125, 0.26728057861328125, 0.2791595458984375, 0.29103851318359375, 0.30291748046875, 0.31479644775390625, 0.3266754150390625, 0.33855438232421875, 0.350433349609375, 0.36231231689453125, 0.3741912841796875, 0.38607025146484375, 0.39794921875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 12.0, 8.0, 9.0, 23.0, 39.0, 36.0, 66.0, 84.0, 114.0, 96.0, 133.0, 101.0, 77.0, 77.0, 46.0, 26.0, 23.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1505126953125, -0.14550209045410156, -0.14049148559570312, -0.1354808807373047, -0.13047027587890625, -0.1254596710205078, -0.12044906616210938, -0.11543846130371094, -0.1104278564453125, -0.10541725158691406, -0.10040664672851562, -0.09539604187011719, -0.09038543701171875, -0.08537483215332031, -0.08036422729492188, -0.07535362243652344, -0.070343017578125, -0.06533241271972656, -0.060321807861328125, -0.05531120300292969, -0.05030059814453125, -0.04528999328613281, -0.040279388427734375, -0.03526878356933594, -0.0302581787109375, -0.025247573852539062, -0.020236968994140625, -0.015226364135742188, -0.01021575927734375, -0.0052051544189453125, -0.000194549560546875, 0.0048160552978515625, 0.00982666015625, 0.014837265014648438, 0.019847869873046875, 0.024858474731445312, 0.02986907958984375, 0.03487968444824219, 0.039890289306640625, 0.04490089416503906, 0.0499114990234375, 0.05492210388183594, 0.059932708740234375, 0.06494331359863281, 0.06995391845703125, 0.07496452331542969, 0.07997512817382812, 0.08498573303222656, 0.089996337890625, 0.09500694274902344, 0.10001754760742188, 0.10502815246582031, 0.11003875732421875, 0.11504936218261719, 0.12005996704101562, 0.12507057189941406, 0.1300811767578125, 0.13509178161621094, 0.14010238647460938, 0.1451129913330078, 0.15012359619140625, 0.1551342010498047, 0.16014480590820312, 0.16515541076660156, 0.170166015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 13.0, 8.0, 12.0, 13.0, 20.0, 30.0, 46.0, 43.0, 63.0, 102.0, 136.0, 178.0, 276.0, 493.0, 742.0, 1422.0, 2668.0, 5632.0, 12721.0, 33439.0, 104741.0, 352142.0, 363012.0, 110387.0, 34658.0, 13466.0, 5795.0, 2736.0, 1403.0, 774.0, 434.0, 297.0, 173.0, 135.0, 93.0, 70.0, 54.0, 34.0, 25.0, 17.0, 12.0, 8.0, 4.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2548828125, -0.24666595458984375, -0.2384490966796875, -0.23023223876953125, -0.222015380859375, -0.21379852294921875, -0.2055816650390625, -0.19736480712890625, -0.18914794921875, -0.18093109130859375, -0.1727142333984375, -0.16449737548828125, -0.156280517578125, -0.14806365966796875, -0.1398468017578125, -0.13162994384765625, -0.1234130859375, -0.11519622802734375, -0.1069793701171875, -0.09876251220703125, -0.090545654296875, -0.08232879638671875, -0.0741119384765625, -0.06589508056640625, -0.05767822265625, -0.04946136474609375, -0.0412445068359375, -0.03302764892578125, -0.024810791015625, -0.01659393310546875, -0.0083770751953125, -0.00016021728515625, 0.008056640625, 0.01627349853515625, 0.0244903564453125, 0.03270721435546875, 0.040924072265625, 0.04914093017578125, 0.0573577880859375, 0.06557464599609375, 0.07379150390625, 0.08200836181640625, 0.0902252197265625, 0.09844207763671875, 0.106658935546875, 0.11487579345703125, 0.1230926513671875, 0.13130950927734375, 0.1395263671875, 0.14774322509765625, 0.1559600830078125, 0.16417694091796875, 0.172393798828125, 0.18061065673828125, 0.1888275146484375, 0.19704437255859375, 0.20526123046875, 0.21347808837890625, 0.2216949462890625, 0.22991180419921875, 0.238128662109375, 0.24634552001953125, 0.2545623779296875, 0.26277923583984375, 0.27099609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 7.0, 8.0, 9.0, 7.0, 21.0, 23.0, 23.0, 34.0, 31.0, 34.0, 33.0, 32.0, 39.0, 52.0, 61.0, 46.0, 54.0, 45.0, 44.0, 42.0, 42.0, 39.0, 35.0, 35.0, 22.0, 26.0, 20.0, 25.0, 14.0, 12.0, 16.0, 8.0, 9.0, 7.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353515625, -0.3412284851074219, -0.32894134521484375, -0.3166542053222656, -0.3043670654296875, -0.2920799255371094, -0.27979278564453125, -0.2675056457519531, -0.255218505859375, -0.24293136596679688, -0.23064422607421875, -0.21835708618164062, -0.2060699462890625, -0.19378280639648438, -0.18149566650390625, -0.16920852661132812, -0.15692138671875, -0.14463424682617188, -0.13234710693359375, -0.12005996704101562, -0.1077728271484375, -0.09548568725585938, -0.08319854736328125, -0.07091140747070312, -0.058624267578125, -0.046337127685546875, -0.03404998779296875, -0.021762847900390625, -0.0094757080078125, 0.002811431884765625, 0.01509857177734375, 0.027385711669921875, 0.0396728515625, 0.051959991455078125, 0.06424713134765625, 0.07653427124023438, 0.0888214111328125, 0.10110855102539062, 0.11339569091796875, 0.12568283081054688, 0.137969970703125, 0.15025711059570312, 0.16254425048828125, 0.17483139038085938, 0.1871185302734375, 0.19940567016601562, 0.21169281005859375, 0.22397994995117188, 0.23626708984375, 0.24855422973632812, 0.26084136962890625, 0.2731285095214844, 0.2854156494140625, 0.2977027893066406, 0.30998992919921875, 0.3222770690917969, 0.334564208984375, 0.3468513488769531, 0.35913848876953125, 0.3714256286621094, 0.3837127685546875, 0.3959999084472656, 0.40828704833984375, 0.4205741882324219, 0.432861328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 23.0, 68.0, 162.0, 629.0, 4230.0, 108011.0, 888239.0, 43986.0, 2514.0, 450.0, 136.0, 44.0, 26.0, 11.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13525390625, -0.12827682495117188, -0.12129974365234375, -0.11432266235351562, -0.1073455810546875, -0.10036849975585938, -0.09339141845703125, -0.08641433715820312, -0.079437255859375, -0.07246017456054688, -0.06548309326171875, -0.058506011962890625, -0.0515289306640625, -0.044551849365234375, -0.03757476806640625, -0.030597686767578125, -0.02362060546875, -0.016643524169921875, -0.00966644287109375, -0.002689361572265625, 0.0042877197265625, 0.011264801025390625, 0.01824188232421875, 0.025218963623046875, 0.032196044921875, 0.039173126220703125, 0.04615020751953125, 0.053127288818359375, 0.0601043701171875, 0.06708145141601562, 0.07405853271484375, 0.08103561401367188, 0.0880126953125, 0.09498977661132812, 0.10196685791015625, 0.10894393920898438, 0.1159210205078125, 0.12289810180664062, 0.12987518310546875, 0.13685226440429688, 0.143829345703125, 0.15080642700195312, 0.15778350830078125, 0.16476058959960938, 0.1717376708984375, 0.17871475219726562, 0.18569183349609375, 0.19266891479492188, 0.19964599609375, 0.20662307739257812, 0.21360015869140625, 0.22057723999023438, 0.2275543212890625, 0.23453140258789062, 0.24150848388671875, 0.24848556518554688, 0.255462646484375, 0.2624397277832031, 0.26941680908203125, 0.2763938903808594, 0.2833709716796875, 0.2903480529785156, 0.29732513427734375, 0.3043022155761719, 0.311279296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 5.0, 8.0, 7.0, 5.0, 16.0, 10.0, 21.0, 17.0, 21.0, 43.0, 53.0, 78.0, 96.0, 111.0, 113.0, 89.0, 63.0, 63.0, 33.0, 20.0, 31.0, 15.0, 7.0, 10.0, 9.0, 12.0, 10.0, 5.0, 3.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.00010967254638671875, -0.00010677520185709, -0.00010387785732746124, -0.00010098051279783249, -9.808316826820374e-05, -9.518582373857498e-05, -9.228847920894623e-05, -8.939113467931747e-05, -8.649379014968872e-05, -8.359644562005997e-05, -8.069910109043121e-05, -7.780175656080246e-05, -7.49044120311737e-05, -7.200706750154495e-05, -6.91097229719162e-05, -6.621237844228745e-05, -6.331503391265869e-05, -6.041768938302994e-05, -5.7520344853401184e-05, -5.462300032377243e-05, -5.172565579414368e-05, -4.882831126451492e-05, -4.593096673488617e-05, -4.3033622205257416e-05, -4.013627767562866e-05, -3.723893314599991e-05, -3.4341588616371155e-05, -3.14442440867424e-05, -2.8546899557113647e-05, -2.5649555027484894e-05, -2.275221049785614e-05, -1.9854865968227386e-05, -1.6957521438598633e-05, -1.4060176908969879e-05, -1.1162832379341125e-05, -8.265487849712372e-06, -5.368143320083618e-06, -2.4707987904548645e-06, 4.2654573917388916e-07, 3.323890268802643e-06, 6.2212347984313965e-06, 9.11857932806015e-06, 1.2015923857688904e-05, 1.4913268387317657e-05, 1.781061291694641e-05, 2.0707957446575165e-05, 2.360530197620392e-05, 2.6502646505832672e-05, 2.9399991035461426e-05, 3.229733556509018e-05, 3.519468009471893e-05, 3.809202462434769e-05, 4.098936915397644e-05, 4.3886713683605194e-05, 4.678405821323395e-05, 4.96814027428627e-05, 5.2578747272491455e-05, 5.547609180212021e-05, 5.837343633174896e-05, 6.127078086137772e-05, 6.416812539100647e-05, 6.706546992063522e-05, 6.996281445026398e-05, 7.286015897989273e-05, 7.575750350952148e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 12.0, 23.0, 26.0, 20.0, 61.0, 89.0, 159.0, 417.0, 1098.0, 4066.0, 31315.0, 528517.0, 450750.0, 26588.0, 3614.0, 1023.0, 370.0, 186.0, 83.0, 45.0, 30.0, 23.0, 13.0, 14.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2215576171875, -0.21614933013916016, -0.2107410430908203, -0.20533275604248047, -0.19992446899414062, -0.19451618194580078, -0.18910789489746094, -0.1836996078491211, -0.17829132080078125, -0.1728830337524414, -0.16747474670410156, -0.16206645965576172, -0.15665817260742188, -0.15124988555908203, -0.1458415985107422, -0.14043331146240234, -0.1350250244140625, -0.12961673736572266, -0.12420845031738281, -0.11880016326904297, -0.11339187622070312, -0.10798358917236328, -0.10257530212402344, -0.0971670150756836, -0.09175872802734375, -0.0863504409790039, -0.08094215393066406, -0.07553386688232422, -0.07012557983398438, -0.06471729278564453, -0.05930900573730469, -0.053900718688964844, -0.048492431640625, -0.043084144592285156, -0.03767585754394531, -0.03226757049560547, -0.026859283447265625, -0.02145099639892578, -0.016042709350585938, -0.010634422302246094, -0.00522613525390625, 0.00018215179443359375, 0.0055904388427734375, 0.010998725891113281, 0.016407012939453125, 0.02181529998779297, 0.027223587036132812, 0.032631874084472656, 0.0380401611328125, 0.043448448181152344, 0.04885673522949219, 0.05426502227783203, 0.059673309326171875, 0.06508159637451172, 0.07048988342285156, 0.0758981704711914, 0.08130645751953125, 0.0867147445678711, 0.09212303161621094, 0.09753131866455078, 0.10293960571289062, 0.10834789276123047, 0.11375617980957031, 0.11916446685791016, 0.12457275390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 9.0, 14.0, 35.0, 68.0, 133.0, 176.0, 187.0, 168.0, 92.0, 62.0, 25.0, 16.0, 11.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.285400390625, -0.27924633026123047, -0.27309226989746094, -0.2669382095336914, -0.2607841491699219, -0.25463008880615234, -0.2484760284423828, -0.24232196807861328, -0.23616790771484375, -0.23001384735107422, -0.2238597869873047, -0.21770572662353516, -0.21155166625976562, -0.2053976058959961, -0.19924354553222656, -0.19308948516845703, -0.1869354248046875, -0.18078136444091797, -0.17462730407714844, -0.1684732437133789, -0.16231918334960938, -0.15616512298583984, -0.1500110626220703, -0.14385700225830078, -0.13770294189453125, -0.13154888153076172, -0.1253948211669922, -0.11924076080322266, -0.11308670043945312, -0.1069326400756836, -0.10077857971191406, -0.09462451934814453, -0.088470458984375, -0.08231639862060547, -0.07616233825683594, -0.0700082778930664, -0.06385421752929688, -0.057700157165527344, -0.05154609680175781, -0.04539203643798828, -0.03923797607421875, -0.03308391571044922, -0.026929855346679688, -0.020775794982910156, -0.014621734619140625, -0.008467674255371094, -0.0023136138916015625, 0.0038404464721679688, 0.0099945068359375, 0.01614856719970703, 0.022302627563476562, 0.028456687927246094, 0.034610748291015625, 0.040764808654785156, 0.04691886901855469, 0.05307292938232422, 0.05922698974609375, 0.06538105010986328, 0.07153511047363281, 0.07768917083740234, 0.08384323120117188, 0.0899972915649414, 0.09615135192871094, 0.10230541229248047, 0.10845947265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 6.0, 10.0, 19.0, 29.0, 61.0, 86.0, 130.0, 177.0, 171.0, 132.0, 61.0, 44.0, 28.0, 12.0, 8.0, 7.0, 10.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2139188051223755, -1.1486256122589111, -1.0833325386047363, -1.018039345741272, -0.9527461528778076, -0.8874529600143433, -0.8221598267555237, -0.7568666934967041, -0.6915735006332397, -0.6262803077697754, -0.5609871745109558, -0.49569401144981384, -0.4304008483886719, -0.3651076853275299, -0.29981452226638794, -0.23452135920524597, -0.169228196144104, -0.10393503308296204, -0.03864187002182007, 0.0266512930393219, 0.09194445610046387, 0.15723761916160583, 0.2225307822227478, 0.28782394528388977, 0.35311710834503174, 0.4184102714061737, 0.4837034344673157, 0.5489965677261353, 0.6142897605895996, 0.679582953453064, 0.7448760867118835, 0.8101692199707031, 0.875462532043457, 0.9407557249069214, 1.0060489177703857, 1.0713419914245605, 1.136635184288025, 1.2019283771514893, 1.267221450805664, 1.3325146436691284, 1.3978078365325928, 1.4631010293960571, 1.5283942222595215, 1.5936872959136963, 1.6589804887771606, 1.724273681640625, 1.7895667552947998, 1.8548599481582642, 1.9201531410217285, 1.9854463338851929, 2.0507395267486572, 2.116032600402832, 2.181325912475586, 2.2466189861297607, 2.3119120597839355, 2.3772053718566895, 2.4424984455108643, 2.507791519165039, 2.573084831237793, 2.6383779048919678, 2.7036709785461426, 2.7689642906188965, 2.8342573642730713, 2.899550676345825, 2.96484375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 11.0, 11.0, 9.0, 6.0, 13.0, 25.0, 21.0, 32.0, 29.0, 30.0, 53.0, 49.0, 60.0, 60.0, 55.0, 83.0, 56.0, 61.0, 55.0, 40.0, 48.0, 33.0, 36.0, 24.0, 18.0, 25.0, 14.0, 15.0, 8.0, 9.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.435960054397583, -3.350484848022461, -3.265009880065918, -3.179534673690796, -3.094059467315674, -3.008584499359131, -2.923109292984009, -2.8376340866088867, -2.7521591186523438, -2.6666839122772217, -2.5812089443206787, -2.4957337379455566, -2.4102585315704346, -2.3247833251953125, -2.2393083572387695, -2.1538331508636475, -2.0683579444885254, -1.9828828573226929, -1.8974076509475708, -1.8119325637817383, -1.7264573574066162, -1.6409822702407837, -1.5555071830749512, -1.470031976699829, -1.3845568895339966, -1.299081802368164, -1.213606595993042, -1.1281315088272095, -1.042656421661377, -0.9571812152862549, -0.8717061281204224, -0.7862309813499451, -0.7007555961608887, -0.6152804493904114, -0.5298053026199341, -0.44433021545410156, -0.35885506868362427, -0.273379921913147, -0.18790483474731445, -0.10242968797683716, -0.016954541206359863, 0.06852059066295624, 0.15399572253227234, 0.23947083950042725, 0.32494598627090454, 0.41042113304138184, 0.49589622020721436, 0.5813713669776917, 0.666846513748169, 0.7523216605186462, 0.8377968072891235, 0.923271894454956, 1.0087471008300781, 1.0942221879959106, 1.1796972751617432, 1.2651724815368652, 1.3506475687026978, 1.4361226558685303, 1.5215978622436523, 1.6070729494094849, 1.6925480365753174, 1.7780232429504395, 1.863498330116272, 1.9489734172821045, 2.0344486236572266]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 10.0, 5.0, 10.0, 7.0, 16.0, 13.0, 35.0, 38.0, 68.0, 68.0, 127.0, 224.0, 389.0, 752.0, 1418.0, 3136.0, 8191.0, 32285.0, 398977.0, 3643523.0, 80888.0, 14847.0, 4782.0, 2006.0, 990.0, 532.0, 321.0, 206.0, 110.0, 83.0, 48.0, 43.0, 31.0, 22.0, 20.0, 11.0, 12.0, 7.0, 4.0, 12.0, 4.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4423828125, -0.42725372314453125, -0.4121246337890625, -0.39699554443359375, -0.381866455078125, -0.36673736572265625, -0.3516082763671875, -0.33647918701171875, -0.32135009765625, -0.30622100830078125, -0.2910919189453125, -0.27596282958984375, -0.260833740234375, -0.24570465087890625, -0.2305755615234375, -0.21544647216796875, -0.2003173828125, -0.18518829345703125, -0.1700592041015625, -0.15493011474609375, -0.139801025390625, -0.12467193603515625, -0.1095428466796875, -0.09441375732421875, -0.07928466796875, -0.06415557861328125, -0.0490264892578125, -0.03389739990234375, -0.018768310546875, -0.00363922119140625, 0.0114898681640625, 0.02661895751953125, 0.041748046875, 0.05687713623046875, 0.0720062255859375, 0.08713531494140625, 0.102264404296875, 0.11739349365234375, 0.1325225830078125, 0.14765167236328125, 0.16278076171875, 0.17790985107421875, 0.1930389404296875, 0.20816802978515625, 0.223297119140625, 0.23842620849609375, 0.2535552978515625, 0.26868438720703125, 0.2838134765625, 0.29894256591796875, 0.3140716552734375, 0.32920074462890625, 0.344329833984375, 0.35945892333984375, 0.3745880126953125, 0.38971710205078125, 0.40484619140625, 0.41997528076171875, 0.4351043701171875, 0.45023345947265625, 0.465362548828125, 0.48049163818359375, 0.4956207275390625, 0.5107498168945312, 0.52587890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 25.0, 32.0, 36.0, 50.0, 50.0, 100.0, 100.0, 97.0, 96.0, 108.0, 86.0, 47.0, 34.0, 39.0, 22.0, 18.0, 11.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1312255859375, -0.1266632080078125, -0.122100830078125, -0.1175384521484375, -0.11297607421875, -0.1084136962890625, -0.103851318359375, -0.0992889404296875, -0.0947265625, -0.0901641845703125, -0.085601806640625, -0.0810394287109375, -0.07647705078125, -0.0719146728515625, -0.067352294921875, -0.0627899169921875, -0.0582275390625, -0.0536651611328125, -0.049102783203125, -0.0445404052734375, -0.03997802734375, -0.0354156494140625, -0.030853271484375, -0.0262908935546875, -0.021728515625, -0.0171661376953125, -0.012603759765625, -0.0080413818359375, -0.00347900390625, 0.0010833740234375, 0.005645751953125, 0.0102081298828125, 0.0147705078125, 0.0193328857421875, 0.023895263671875, 0.0284576416015625, 0.03302001953125, 0.0375823974609375, 0.042144775390625, 0.0467071533203125, 0.05126953125, 0.0558319091796875, 0.060394287109375, 0.0649566650390625, 0.06951904296875, 0.0740814208984375, 0.078643798828125, 0.0832061767578125, 0.0877685546875, 0.0923309326171875, 0.096893310546875, 0.1014556884765625, 0.10601806640625, 0.1105804443359375, 0.115142822265625, 0.1197052001953125, 0.124267578125, 0.1288299560546875, 0.133392333984375, 0.1379547119140625, 0.14251708984375, 0.1470794677734375, 0.151641845703125, 0.1562042236328125, 0.1607666015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 8.0, 7.0, 10.0, 15.0, 23.0, 49.0, 74.0, 96.0, 170.0, 300.0, 531.0, 966.0, 1808.0, 3871.0, 10017.0, 44853.0, 695212.0, 3299438.0, 108305.0, 18161.0, 5490.0, 2301.0, 1132.0, 570.0, 334.0, 205.0, 120.0, 57.0, 42.0, 36.0, 27.0, 17.0, 10.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.42333984375, -0.41306495666503906, -0.4027900695800781, -0.3925151824951172, -0.38224029541015625, -0.3719654083251953, -0.3616905212402344, -0.35141563415527344, -0.3411407470703125, -0.33086585998535156, -0.3205909729003906, -0.3103160858154297, -0.30004119873046875, -0.2897663116455078, -0.2794914245605469, -0.26921653747558594, -0.258941650390625, -0.24866676330566406, -0.23839187622070312, -0.2281169891357422, -0.21784210205078125, -0.2075672149658203, -0.19729232788085938, -0.18701744079589844, -0.1767425537109375, -0.16646766662597656, -0.15619277954101562, -0.1459178924560547, -0.13564300537109375, -0.1253681182861328, -0.11509323120117188, -0.10481834411621094, -0.09454345703125, -0.08426856994628906, -0.07399368286132812, -0.06371879577636719, -0.05344390869140625, -0.04316902160644531, -0.032894134521484375, -0.022619247436523438, -0.0123443603515625, -0.0020694732666015625, 0.008205413818359375, 0.018480300903320312, 0.02875518798828125, 0.03903007507324219, 0.049304962158203125, 0.05957984924316406, 0.069854736328125, 0.08012962341308594, 0.09040451049804688, 0.10067939758300781, 0.11095428466796875, 0.12122917175292969, 0.13150405883789062, 0.14177894592285156, 0.1520538330078125, 0.16232872009277344, 0.17260360717773438, 0.1828784942626953, 0.19315338134765625, 0.2034282684326172, 0.21370315551757812, 0.22397804260253906, 0.2342529296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 9.0, 6.0, 16.0, 32.0, 71.0, 139.0, 341.0, 1633.0, 1219.0, 312.0, 119.0, 59.0, 40.0, 20.0, 18.0, 5.0, 15.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20947265625, -0.20246315002441406, -0.19545364379882812, -0.1884441375732422, -0.18143463134765625, -0.1744251251220703, -0.16741561889648438, -0.16040611267089844, -0.1533966064453125, -0.14638710021972656, -0.13937759399414062, -0.1323680877685547, -0.12535858154296875, -0.11834907531738281, -0.11133956909179688, -0.10433006286621094, -0.097320556640625, -0.09031105041503906, -0.08330154418945312, -0.07629203796386719, -0.06928253173828125, -0.06227302551269531, -0.055263519287109375, -0.04825401306152344, -0.0412445068359375, -0.03423500061035156, -0.027225494384765625, -0.020215988159179688, -0.01320648193359375, -0.0061969757080078125, 0.000812530517578125, 0.007822036743164062, 0.01483154296875, 0.021841049194335938, 0.028850555419921875, 0.03586006164550781, 0.04286956787109375, 0.04987907409667969, 0.056888580322265625, 0.06389808654785156, 0.0709075927734375, 0.07791709899902344, 0.08492660522460938, 0.09193611145019531, 0.09894561767578125, 0.10595512390136719, 0.11296463012695312, 0.11997413635253906, 0.126983642578125, 0.13399314880371094, 0.14100265502929688, 0.1480121612548828, 0.15502166748046875, 0.1620311737060547, 0.16904067993164062, 0.17605018615722656, 0.1830596923828125, 0.19006919860839844, 0.19707870483398438, 0.2040882110595703, 0.21109771728515625, 0.2181072235107422, 0.22511672973632812, 0.23212623596191406, 0.2391357421875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 9.0, 29.0, 67.0, 130.0, 217.0, 223.0, 159.0, 94.0, 35.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8653675317764282, -0.8305153846740723, -0.7956632375717163, -0.7608110308647156, -0.7259588837623596, -0.6911067366600037, -0.6562545299530029, -0.621402382850647, -0.586550235748291, -0.5516980886459351, -0.5168459415435791, -0.48199373483657837, -0.4471415877342224, -0.41228944063186646, -0.3774372637271881, -0.34258508682250977, -0.3077329397201538, -0.27288079261779785, -0.2380286157131195, -0.20317645370960236, -0.1683242917060852, -0.13347212970256805, -0.0986199676990509, -0.06376780569553375, -0.0289156436920166, 0.005936518311500549, 0.0407886803150177, 0.07564084231853485, 0.110493004322052, 0.14534516632556915, 0.1801973283290863, 0.21504949033260345, 0.24990177154541016, 0.2847539186477661, 0.31960609555244446, 0.3544582724571228, 0.38931041955947876, 0.4241625666618347, 0.45901474356651306, 0.4938669204711914, 0.5287190675735474, 0.5635712146759033, 0.5984233617782593, 0.63327556848526, 0.668127715587616, 0.7029798626899719, 0.7378320693969727, 0.7726842164993286, 0.8075363636016846, 0.8423885107040405, 0.8772406578063965, 0.9120928645133972, 0.9469450116157532, 0.9817971587181091, 1.0166493654251099, 1.0515015125274658, 1.0863536596298218, 1.1212058067321777, 1.1560579538345337, 1.1909101009368896, 1.2257623672485352, 1.2606145143508911, 1.295466661453247, 1.330318808555603, 1.365170955657959]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 5.0, 7.0, 14.0, 17.0, 21.0, 25.0, 29.0, 52.0, 52.0, 70.0, 63.0, 62.0, 76.0, 78.0, 77.0, 77.0, 42.0, 49.0, 42.0, 42.0, 25.0, 18.0, 19.0, 11.0, 12.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6058604121208191, -0.5822413563728333, -0.5586223602294922, -0.5350033044815063, -0.5113843083381653, -0.48776525259017944, -0.464146226644516, -0.44052720069885254, -0.4169081449508667, -0.39328911900520325, -0.3696700930595398, -0.34605103731155396, -0.3224320113658905, -0.29881298542022705, -0.2751939594745636, -0.25157493352890015, -0.2279559075832367, -0.20433688163757324, -0.1807178407907486, -0.15709881484508514, -0.1334797739982605, -0.10986074805259705, -0.0862417221069336, -0.06262268126010895, -0.039003655314445496, -0.015384623780846596, 0.008234407752752304, 0.031853437423706055, 0.055472470819950104, 0.07909150421619415, 0.1027105301618576, 0.12632957100868225, 0.1499485969543457, 0.17356762290000916, 0.1971866637468338, 0.22080568969249725, 0.2444247305393219, 0.26804375648498535, 0.2916627824306488, 0.31528180837631226, 0.3389008641242981, 0.36251989006996155, 0.386138916015625, 0.40975797176361084, 0.4333769977092743, 0.45699602365493774, 0.4806150496006012, 0.5042340755462646, 0.5278531312942505, 0.5514721870422363, 0.5750911831855774, 0.5987102389335632, 0.6223292350769043, 0.6459482908248901, 0.669567346572876, 0.693186342716217, 0.7168053388595581, 0.740424394607544, 0.764043390750885, 0.7876624464988708, 0.8112814426422119, 0.8349004983901978, 0.8585195541381836, 0.8821385502815247, 0.9057576060295105]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 14.0, 24.0, 58.0, 72.0, 138.0, 303.0, 685.0, 1713.0, 5988.0, 42290.0, 679861.0, 291914.0, 19424.0, 3742.0, 1228.0, 522.0, 274.0, 136.0, 60.0, 27.0, 17.0, 12.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7678298950195312, -0.7451324462890625, -0.7224349975585938, -0.699737548828125, -0.6770401000976562, -0.6543426513671875, -0.6316452026367188, -0.60894775390625, -0.5862503051757812, -0.5635528564453125, -0.5408554077148438, -0.518157958984375, -0.49546051025390625, -0.4727630615234375, -0.45006561279296875, -0.4273681640625, -0.40467071533203125, -0.3819732666015625, -0.35927581787109375, -0.336578369140625, -0.31388092041015625, -0.2911834716796875, -0.26848602294921875, -0.24578857421875, -0.22309112548828125, -0.2003936767578125, -0.17769622802734375, -0.154998779296875, -0.13230133056640625, -0.1096038818359375, -0.08690643310546875, -0.064208984375, -0.04151153564453125, -0.0188140869140625, 0.00388336181640625, 0.026580810546875, 0.04927825927734375, 0.0719757080078125, 0.09467315673828125, 0.11737060546875, 0.14006805419921875, 0.1627655029296875, 0.18546295166015625, 0.208160400390625, 0.23085784912109375, 0.2535552978515625, 0.27625274658203125, 0.2989501953125, 0.32164764404296875, 0.3443450927734375, 0.36704254150390625, 0.389739990234375, 0.41243743896484375, 0.4351348876953125, 0.45783233642578125, 0.48052978515625, 0.5032272338867188, 0.5259246826171875, 0.5486221313476562, 0.571319580078125, 0.5940170288085938, 0.6167144775390625, 0.6394119262695312, 0.662109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 8.0, 14.0, 21.0, 21.0, 54.0, 56.0, 60.0, 92.0, 122.0, 119.0, 104.0, 117.0, 59.0, 45.0, 38.0, 28.0, 10.0, 7.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12030029296875, -0.11536312103271484, -0.11042594909667969, -0.10548877716064453, -0.10055160522460938, -0.09561443328857422, -0.09067726135253906, -0.0857400894165039, -0.08080291748046875, -0.0758657455444336, -0.07092857360839844, -0.06599140167236328, -0.061054229736328125, -0.05611705780029297, -0.05117988586425781, -0.046242713928222656, -0.0413055419921875, -0.036368370056152344, -0.03143119812011719, -0.02649402618408203, -0.021556854248046875, -0.01661968231201172, -0.011682510375976562, -0.006745338439941406, -0.00180816650390625, 0.0031290054321289062, 0.008066177368164062, 0.013003349304199219, 0.017940521240234375, 0.02287769317626953, 0.027814865112304688, 0.032752037048339844, 0.037689208984375, 0.042626380920410156, 0.04756355285644531, 0.05250072479248047, 0.057437896728515625, 0.06237506866455078, 0.06731224060058594, 0.0722494125366211, 0.07718658447265625, 0.0821237564086914, 0.08706092834472656, 0.09199810028076172, 0.09693527221679688, 0.10187244415283203, 0.10680961608886719, 0.11174678802490234, 0.1166839599609375, 0.12162113189697266, 0.1265583038330078, 0.13149547576904297, 0.13643264770507812, 0.14136981964111328, 0.14630699157714844, 0.1512441635131836, 0.15618133544921875, 0.1611185073852539, 0.16605567932128906, 0.17099285125732422, 0.17593002319335938, 0.18086719512939453, 0.1858043670654297, 0.19074153900146484, 0.1956787109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 10.0, 18.0, 23.0, 46.0, 95.0, 162.0, 295.0, 677.0, 1594.0, 4427.0, 14306.0, 57077.0, 280408.0, 512205.0, 134802.0, 29525.0, 8127.0, 2746.0, 1041.0, 433.0, 217.0, 144.0, 82.0, 36.0, 28.0, 10.0, 7.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24658203125, -0.23642349243164062, -0.22626495361328125, -0.21610641479492188, -0.2059478759765625, -0.19578933715820312, -0.18563079833984375, -0.17547225952148438, -0.165313720703125, -0.15515518188476562, -0.14499664306640625, -0.13483810424804688, -0.1246795654296875, -0.11452102661132812, -0.10436248779296875, -0.09420394897460938, -0.08404541015625, -0.07388687133789062, -0.06372833251953125, -0.053569793701171875, -0.0434112548828125, -0.033252716064453125, -0.02309417724609375, -0.012935638427734375, -0.002777099609375, 0.007381439208984375, 0.01753997802734375, 0.027698516845703125, 0.0378570556640625, 0.048015594482421875, 0.05817413330078125, 0.06833267211914062, 0.0784912109375, 0.08864974975585938, 0.09880828857421875, 0.10896682739257812, 0.1191253662109375, 0.12928390502929688, 0.13944244384765625, 0.14960098266601562, 0.159759521484375, 0.16991806030273438, 0.18007659912109375, 0.19023513793945312, 0.2003936767578125, 0.21055221557617188, 0.22071075439453125, 0.23086929321289062, 0.24102783203125, 0.2511863708496094, 0.26134490966796875, 0.2715034484863281, 0.2816619873046875, 0.2918205261230469, 0.30197906494140625, 0.3121376037597656, 0.322296142578125, 0.3324546813964844, 0.34261322021484375, 0.3527717590332031, 0.3629302978515625, 0.3730888366699219, 0.38324737548828125, 0.3934059143066406, 0.403564453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 2.0, 6.0, 7.0, 9.0, 5.0, 11.0, 16.0, 21.0, 18.0, 37.0, 23.0, 29.0, 27.0, 43.0, 30.0, 39.0, 43.0, 29.0, 51.0, 33.0, 44.0, 41.0, 43.0, 32.0, 43.0, 34.0, 35.0, 39.0, 33.0, 27.0, 23.0, 23.0, 18.0, 16.0, 8.0, 11.0, 9.0, 8.0, 11.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.363525390625, -0.35344696044921875, -0.3433685302734375, -0.33329010009765625, -0.323211669921875, -0.31313323974609375, -0.3030548095703125, -0.29297637939453125, -0.28289794921875, -0.27281951904296875, -0.2627410888671875, -0.25266265869140625, -0.242584228515625, -0.23250579833984375, -0.2224273681640625, -0.21234893798828125, -0.2022705078125, -0.19219207763671875, -0.1821136474609375, -0.17203521728515625, -0.161956787109375, -0.15187835693359375, -0.1417999267578125, -0.13172149658203125, -0.12164306640625, -0.11156463623046875, -0.1014862060546875, -0.09140777587890625, -0.081329345703125, -0.07125091552734375, -0.0611724853515625, -0.05109405517578125, -0.041015625, -0.03093719482421875, -0.0208587646484375, -0.01078033447265625, -0.000701904296875, 0.00937652587890625, 0.0194549560546875, 0.02953338623046875, 0.03961181640625, 0.04969024658203125, 0.0597686767578125, 0.06984710693359375, 0.079925537109375, 0.09000396728515625, 0.1000823974609375, 0.11016082763671875, 0.1202392578125, 0.13031768798828125, 0.1403961181640625, 0.15047454833984375, 0.160552978515625, 0.17063140869140625, 0.1807098388671875, 0.19078826904296875, 0.20086669921875, 0.21094512939453125, 0.2210235595703125, 0.23110198974609375, 0.241180419921875, 0.25125885009765625, 0.2613372802734375, 0.27141571044921875, 0.281494140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 2.0, 7.0, 13.0, 34.0, 85.0, 255.0, 1356.0, 40854.0, 988510.0, 16152.0, 963.0, 201.0, 71.0, 22.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.41574859619140625, -0.4040069580078125, -0.39226531982421875, -0.380523681640625, -0.36878204345703125, -0.3570404052734375, -0.34529876708984375, -0.33355712890625, -0.32181549072265625, -0.3100738525390625, -0.29833221435546875, -0.286590576171875, -0.27484893798828125, -0.2631072998046875, -0.25136566162109375, -0.2396240234375, -0.22788238525390625, -0.2161407470703125, -0.20439910888671875, -0.192657470703125, -0.18091583251953125, -0.1691741943359375, -0.15743255615234375, -0.14569091796875, -0.13394927978515625, -0.1222076416015625, -0.11046600341796875, -0.098724365234375, -0.08698272705078125, -0.0752410888671875, -0.06349945068359375, -0.0517578125, -0.04001617431640625, -0.0282745361328125, -0.01653289794921875, -0.004791259765625, 0.00695037841796875, 0.0186920166015625, 0.03043365478515625, 0.04217529296875, 0.05391693115234375, 0.0656585693359375, 0.07740020751953125, 0.089141845703125, 0.10088348388671875, 0.1126251220703125, 0.12436676025390625, 0.1361083984375, 0.14785003662109375, 0.1595916748046875, 0.17133331298828125, 0.183074951171875, 0.19481658935546875, 0.2065582275390625, 0.21829986572265625, 0.23004150390625, 0.24178314208984375, 0.2535247802734375, 0.26526641845703125, 0.277008056640625, 0.28874969482421875, 0.3004913330078125, 0.31223297119140625, 0.323974609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 4.0, 11.0, 9.0, 11.0, 7.0, 16.0, 20.0, 20.0, 26.0, 40.0, 65.0, 78.0, 125.0, 134.0, 116.0, 73.0, 45.0, 44.0, 29.0, 20.0, 22.0, 18.0, 14.0, 12.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011581182479858398, -0.00011294335126876831, -0.00011007487773895264, -0.00010720640420913696, -0.00010433793067932129, -0.00010146945714950562, -9.860098361968994e-05, -9.573251008987427e-05, -9.28640365600586e-05, -8.999556303024292e-05, -8.712708950042725e-05, -8.425861597061157e-05, -8.13901424407959e-05, -7.852166891098022e-05, -7.565319538116455e-05, -7.278472185134888e-05, -6.99162483215332e-05, -6.704777479171753e-05, -6.417930126190186e-05, -6.131082773208618e-05, -5.844235420227051e-05, -5.5573880672454834e-05, -5.270540714263916e-05, -4.9836933612823486e-05, -4.696846008300781e-05, -4.409998655319214e-05, -4.1231513023376465e-05, -3.836303949356079e-05, -3.549456596374512e-05, -3.262609243392944e-05, -2.975761890411377e-05, -2.6889145374298096e-05, -2.4020671844482422e-05, -2.1152198314666748e-05, -1.8283724784851074e-05, -1.54152512550354e-05, -1.2546777725219727e-05, -9.678304195404053e-06, -6.809830665588379e-06, -3.941357135772705e-06, -1.0728836059570312e-06, 1.7955899238586426e-06, 4.664063453674316e-06, 7.53253698348999e-06, 1.0401010513305664e-05, 1.3269484043121338e-05, 1.6137957572937012e-05, 1.9006431102752686e-05, 2.187490463256836e-05, 2.4743378162384033e-05, 2.7611851692199707e-05, 3.048032522201538e-05, 3.3348798751831055e-05, 3.621727228164673e-05, 3.90857458114624e-05, 4.1954219341278076e-05, 4.482269287109375e-05, 4.7691166400909424e-05, 5.05596399307251e-05, 5.342811346054077e-05, 5.6296586990356445e-05, 5.916506052017212e-05, 6.203353404998779e-05, 6.490200757980347e-05, 6.777048110961914e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 8.0, 9.0, 15.0, 44.0, 104.0, 321.0, 1030.0, 4782.0, 58098.0, 876229.0, 99484.0, 6535.0, 1275.0, 367.0, 121.0, 57.0, 19.0, 14.0, 15.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.23296165466308594, -0.22581100463867188, -0.2186603546142578, -0.21150970458984375, -0.2043590545654297, -0.19720840454101562, -0.19005775451660156, -0.1829071044921875, -0.17575645446777344, -0.16860580444335938, -0.1614551544189453, -0.15430450439453125, -0.1471538543701172, -0.14000320434570312, -0.13285255432128906, -0.125701904296875, -0.11855125427246094, -0.11140060424804688, -0.10424995422363281, -0.09709930419921875, -0.08994865417480469, -0.08279800415039062, -0.07564735412597656, -0.0684967041015625, -0.06134605407714844, -0.054195404052734375, -0.04704475402832031, -0.03989410400390625, -0.03274345397949219, -0.025592803955078125, -0.018442153930664062, -0.01129150390625, -0.0041408538818359375, 0.003009796142578125, 0.010160446166992188, 0.01731109619140625, 0.024461746215820312, 0.031612396240234375, 0.03876304626464844, 0.0459136962890625, 0.05306434631347656, 0.060214996337890625, 0.06736564636230469, 0.07451629638671875, 0.08166694641113281, 0.08881759643554688, 0.09596824645996094, 0.103118896484375, 0.11026954650878906, 0.11742019653320312, 0.12457084655761719, 0.13172149658203125, 0.1388721466064453, 0.14602279663085938, 0.15317344665527344, 0.1603240966796875, 0.16747474670410156, 0.17462539672851562, 0.1817760467529297, 0.18892669677734375, 0.1960773468017578, 0.20322799682617188, 0.21037864685058594, 0.217529296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 11.0, 7.0, 11.0, 26.0, 34.0, 46.0, 62.0, 67.0, 73.0, 101.0, 107.0, 77.0, 80.0, 59.0, 51.0, 41.0, 25.0, 26.0, 17.0, 12.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0924072265625, -0.08945274353027344, -0.08649826049804688, -0.08354377746582031, -0.08058929443359375, -0.07763481140136719, -0.07468032836914062, -0.07172584533691406, -0.0687713623046875, -0.06581687927246094, -0.06286239624023438, -0.05990791320800781, -0.05695343017578125, -0.05399894714355469, -0.051044464111328125, -0.04808998107910156, -0.045135498046875, -0.04218101501464844, -0.039226531982421875, -0.03627204895019531, -0.03331756591796875, -0.030363082885742188, -0.027408599853515625, -0.024454116821289062, -0.0214996337890625, -0.018545150756835938, -0.015590667724609375, -0.012636184692382812, -0.00968170166015625, -0.0067272186279296875, -0.003772735595703125, -0.0008182525634765625, 0.00213623046875, 0.0050907135009765625, 0.008045196533203125, 0.010999679565429688, 0.01395416259765625, 0.016908645629882812, 0.019863128662109375, 0.022817611694335938, 0.0257720947265625, 0.028726577758789062, 0.031681060791015625, 0.03463554382324219, 0.03759002685546875, 0.04054450988769531, 0.043498992919921875, 0.04645347595214844, 0.049407958984375, 0.05236244201660156, 0.055316925048828125, 0.05827140808105469, 0.06122589111328125, 0.06418037414550781, 0.06713485717773438, 0.07008934020996094, 0.0730438232421875, 0.07599830627441406, 0.07895278930664062, 0.08190727233886719, 0.08486175537109375, 0.08781623840332031, 0.09077072143554688, 0.09372520446777344, 0.0966796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 9.0, 23.0, 25.0, 48.0, 60.0, 108.0, 135.0, 175.0, 141.0, 87.0, 55.0, 38.0, 24.0, 14.0, 16.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.293674945831299, -2.240849256515503, -2.188023328781128, -2.135197639465332, -2.082371950149536, -2.029546022415161, -1.9767203330993652, -1.9238945245742798, -1.8710687160491943, -1.8182429075241089, -1.765417218208313, -1.7125914096832275, -1.659765601158142, -1.6069397926330566, -1.5541141033172607, -1.5012882947921753, -1.4484626054763794, -1.395636796951294, -1.342811107635498, -1.2899852991104126, -1.2371594905853271, -1.1843338012695312, -1.1315079927444458, -1.0786821842193604, -1.0258564949035645, -0.9730307459831238, -0.9202049374580383, -0.8673791885375977, -0.8145533800125122, -0.7617276310920715, -0.7089018821716309, -0.6560760736465454, -0.60325026512146, -0.5504245162010193, -0.49759870767593384, -0.44477295875549316, -0.3919471800327301, -0.33912140130996704, -0.28629565238952637, -0.2334698736667633, -0.18064409494400024, -0.12781831622123718, -0.07499255239963531, -0.022166788578033447, 0.030658990144729614, 0.08348476886749268, 0.13631051778793335, 0.1891362965106964, 0.24196207523345947, 0.29478785395622253, 0.3476136326789856, 0.40043938159942627, 0.45326516032218933, 0.5060909390449524, 0.5589166879653931, 0.6117424964904785, 0.6645682454109192, 0.7173939943313599, 0.7702198028564453, 0.823045551776886, 0.8758713006973267, 0.9286971092224121, 0.9815228581428528, 1.0343486070632935, 1.087174415588379]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 14.0, 19.0, 22.0, 15.0, 24.0, 36.0, 37.0, 46.0, 37.0, 49.0, 54.0, 70.0, 56.0, 51.0, 68.0, 49.0, 58.0, 40.0, 43.0, 41.0, 28.0, 28.0, 29.0, 21.0, 14.0, 13.0, 6.0, 4.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5013625621795654, -2.4256365299224854, -2.3499104976654053, -2.2741847038269043, -2.198458671569824, -2.122732639312744, -2.047006607055664, -1.971280574798584, -1.8955546617507935, -1.8198286294937134, -1.7441027164459229, -1.6683766841888428, -1.5926506519317627, -1.5169247388839722, -1.441198706626892, -1.3654727935791016, -1.2897467613220215, -1.2140207290649414, -1.1382948160171509, -1.0625687837600708, -0.9868428111076355, -0.9111168384552002, -0.8353908061981201, -0.7596648335456848, -0.6839388608932495, -0.6082128882408142, -0.5324869155883789, -0.45676088333129883, -0.3810349106788635, -0.3053089380264282, -0.22958293557167053, -0.15385693311691284, -0.07813096046447754, -0.0024049729108810425, 0.07332101464271545, 0.14904700219631195, 0.22477298974990845, 0.30049896240234375, 0.37622496485710144, 0.45195096731185913, 0.5276769399642944, 0.6034029126167297, 0.679128885269165, 0.7548549175262451, 0.8305808901786804, 0.9063068628311157, 0.9820328950881958, 1.0577588081359863, 1.1334848403930664, 1.2092108726501465, 1.284936785697937, 1.360662817955017, 1.4363887310028076, 1.5121147632598877, 1.5878407955169678, 1.6635668277740479, 1.7392927408218384, 1.8150187730789185, 1.890744686126709, 1.966470718383789, 2.042196750640869, 2.117922782897949, 2.19364857673645, 2.2693746089935303, 2.3451006412506104]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 10.0, 11.0, 23.0, 38.0, 64.0, 100.0, 178.0, 323.0, 536.0, 1231.0, 2860.0, 9694.0, 53355.0, 3742556.0, 350587.0, 23317.0, 5555.0, 1963.0, 825.0, 375.0, 262.0, 144.0, 77.0, 54.0, 45.0, 23.0, 17.0, 16.0, 8.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4013671875, -0.3883323669433594, -0.37529754638671875, -0.3622627258300781, -0.3492279052734375, -0.3361930847167969, -0.32315826416015625, -0.3101234436035156, -0.297088623046875, -0.2840538024902344, -0.27101898193359375, -0.2579841613769531, -0.2449493408203125, -0.23191452026367188, -0.21887969970703125, -0.20584487915039062, -0.19281005859375, -0.17977523803710938, -0.16674041748046875, -0.15370559692382812, -0.1406707763671875, -0.12763595581054688, -0.11460113525390625, -0.10156631469726562, -0.088531494140625, -0.07549667358398438, -0.06246185302734375, -0.049427032470703125, -0.0363922119140625, -0.023357391357421875, -0.01032257080078125, 0.002712249755859375, 0.0157470703125, 0.028781890869140625, 0.04181671142578125, 0.054851531982421875, 0.0678863525390625, 0.08092117309570312, 0.09395599365234375, 0.10699081420898438, 0.120025634765625, 0.13306045532226562, 0.14609527587890625, 0.15913009643554688, 0.1721649169921875, 0.18519973754882812, 0.19823455810546875, 0.21126937866210938, 0.22430419921875, 0.23733901977539062, 0.25037384033203125, 0.2634086608886719, 0.2764434814453125, 0.2894783020019531, 0.30251312255859375, 0.3155479431152344, 0.328582763671875, 0.3416175842285156, 0.35465240478515625, 0.3676872253417969, 0.3807220458984375, 0.3937568664550781, 0.40679168701171875, 0.4198265075683594, 0.432861328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 15.0, 41.0, 43.0, 72.0, 68.0, 85.0, 122.0, 108.0, 102.0, 91.0, 63.0, 52.0, 37.0, 25.0, 16.0, 4.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11700439453125, -0.11195659637451172, -0.10690879821777344, -0.10186100006103516, -0.09681320190429688, -0.0917654037475586, -0.08671760559082031, -0.08166980743408203, -0.07662200927734375, -0.07157421112060547, -0.06652641296386719, -0.061478614807128906, -0.056430816650390625, -0.051383018493652344, -0.04633522033691406, -0.04128742218017578, -0.0362396240234375, -0.03119182586669922, -0.026144027709960938, -0.021096229553222656, -0.016048431396484375, -0.011000633239746094, -0.0059528350830078125, -0.0009050369262695312, 0.00414276123046875, 0.009190559387207031, 0.014238357543945312, 0.019286155700683594, 0.024333953857421875, 0.029381752014160156, 0.03442955017089844, 0.03947734832763672, 0.044525146484375, 0.04957294464111328, 0.05462074279785156, 0.059668540954589844, 0.06471633911132812, 0.0697641372680664, 0.07481193542480469, 0.07985973358154297, 0.08490753173828125, 0.08995532989501953, 0.09500312805175781, 0.1000509262084961, 0.10509872436523438, 0.11014652252197266, 0.11519432067871094, 0.12024211883544922, 0.1252899169921875, 0.13033771514892578, 0.13538551330566406, 0.14043331146240234, 0.14548110961914062, 0.1505289077758789, 0.1555767059326172, 0.16062450408935547, 0.16567230224609375, 0.17072010040283203, 0.1757678985595703, 0.1808156967163086, 0.18586349487304688, 0.19091129302978516, 0.19595909118652344, 0.20100688934326172, 0.2060546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 23.0, 15.0, 35.0, 54.0, 88.0, 162.0, 272.0, 498.0, 1023.0, 2611.0, 8841.0, 53413.0, 2214403.0, 1850058.0, 49405.0, 8456.0, 2551.0, 1006.0, 524.0, 289.0, 189.0, 128.0, 75.0, 52.0, 22.0, 23.0, 14.0, 8.0, 10.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.22676467895507812, -0.21768951416015625, -0.20861434936523438, -0.1995391845703125, -0.19046401977539062, -0.18138885498046875, -0.17231369018554688, -0.163238525390625, -0.15416336059570312, -0.14508819580078125, -0.13601303100585938, -0.1269378662109375, -0.11786270141601562, -0.10878753662109375, -0.09971237182617188, -0.09063720703125, -0.08156204223632812, -0.07248687744140625, -0.06341171264648438, -0.0543365478515625, -0.045261383056640625, -0.03618621826171875, -0.027111053466796875, -0.018035888671875, -0.008960723876953125, 0.00011444091796875, 0.009189605712890625, 0.0182647705078125, 0.027339935302734375, 0.03641510009765625, 0.045490264892578125, 0.0545654296875, 0.06364059448242188, 0.07271575927734375, 0.08179092407226562, 0.0908660888671875, 0.09994125366210938, 0.10901641845703125, 0.11809158325195312, 0.127166748046875, 0.13624191284179688, 0.14531707763671875, 0.15439224243164062, 0.1634674072265625, 0.17254257202148438, 0.18161773681640625, 0.19069290161132812, 0.19976806640625, 0.20884323120117188, 0.21791839599609375, 0.22699356079101562, 0.2360687255859375, 0.24514389038085938, 0.25421905517578125, 0.2632942199707031, 0.272369384765625, 0.2814445495605469, 0.29051971435546875, 0.2995948791503906, 0.3086700439453125, 0.3177452087402344, 0.32682037353515625, 0.3358955383300781, 0.344970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 8.0, 14.0, 14.0, 22.0, 27.0, 57.0, 107.0, 238.0, 748.0, 1904.0, 540.0, 188.0, 83.0, 48.0, 22.0, 19.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08050537109375, -0.07655048370361328, -0.07259559631347656, -0.06864070892333984, -0.06468582153320312, -0.060730934143066406, -0.05677604675292969, -0.05282115936279297, -0.04886627197265625, -0.04491138458251953, -0.04095649719238281, -0.037001609802246094, -0.033046722412109375, -0.029091835021972656, -0.025136947631835938, -0.02118206024169922, -0.0172271728515625, -0.013272285461425781, -0.009317398071289062, -0.005362510681152344, -0.001407623291015625, 0.0025472640991210938, 0.0065021514892578125, 0.010457038879394531, 0.01441192626953125, 0.01836681365966797, 0.022321701049804688, 0.026276588439941406, 0.030231475830078125, 0.034186363220214844, 0.03814125061035156, 0.04209613800048828, 0.046051025390625, 0.05000591278076172, 0.05396080017089844, 0.057915687561035156, 0.061870574951171875, 0.0658254623413086, 0.06978034973144531, 0.07373523712158203, 0.07769012451171875, 0.08164501190185547, 0.08559989929199219, 0.0895547866821289, 0.09350967407226562, 0.09746456146240234, 0.10141944885253906, 0.10537433624267578, 0.1093292236328125, 0.11328411102294922, 0.11723899841308594, 0.12119388580322266, 0.12514877319335938, 0.1291036605834961, 0.1330585479736328, 0.13701343536376953, 0.14096832275390625, 0.14492321014404297, 0.1488780975341797, 0.1528329849243164, 0.15678787231445312, 0.16074275970458984, 0.16469764709472656, 0.16865253448486328, 0.172607421875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 37.0, 121.0, 254.0, 285.0, 174.0, 79.0, 25.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6286548376083374, -0.6005786657333374, -0.5725024938583374, -0.5444262623786926, -0.5163500905036926, -0.4882739186286926, -0.46019771695137024, -0.43212151527404785, -0.40404534339904785, -0.37596917152404785, -0.34789296984672546, -0.3198167681694031, -0.2917405962944031, -0.2636644244194031, -0.2355882227420807, -0.2075120359659195, -0.1794358491897583, -0.1513596624135971, -0.12328347563743591, -0.09520728886127472, -0.06713110208511353, -0.03905491530895233, -0.010978728532791138, 0.017097458243370056, 0.04517364501953125, 0.07324983179569244, 0.10132601857185364, 0.12940220534801483, 0.15747839212417603, 0.18555457890033722, 0.2136307656764984, 0.2417069524526596, 0.2697831392288208, 0.2978593111038208, 0.3259355127811432, 0.3540117144584656, 0.3820878863334656, 0.4101640582084656, 0.43824025988578796, 0.46631646156311035, 0.49439263343811035, 0.5224688053131104, 0.5505449771881104, 0.5786212086677551, 0.6066973805427551, 0.6347735524177551, 0.6628497838973999, 0.6909259557723999, 0.7190021276473999, 0.7470782995223999, 0.7751544713973999, 0.8032307028770447, 0.8313068747520447, 0.8593830466270447, 0.8874592781066895, 0.9155354499816895, 0.9436116218566895, 0.9716877937316895, 0.9997639656066895, 1.0278401374816895, 1.0559163093566895, 1.083992600440979, 1.112068772315979, 1.140144944190979, 1.168221116065979]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 10.0, 10.0, 13.0, 14.0, 13.0, 28.0, 47.0, 31.0, 46.0, 39.0, 42.0, 60.0, 46.0, 55.0, 45.0, 46.0, 55.0, 66.0, 56.0, 51.0, 34.0, 30.0, 39.0, 16.0, 23.0, 20.0, 9.0, 10.0, 8.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.40505343675613403, -0.3944965600967407, -0.3839397132396698, -0.3733828365802765, -0.3628259599208832, -0.35226911306381226, -0.34171223640441895, -0.33115535974502563, -0.3205984830856323, -0.310041606426239, -0.2994847595691681, -0.2889278829097748, -0.27837100625038147, -0.26781415939331055, -0.25725728273391724, -0.24670040607452393, -0.236143559217453, -0.2255866974592209, -0.21502982079982758, -0.20447295904159546, -0.19391608238220215, -0.18335922062397003, -0.17280235886573792, -0.1622454822063446, -0.1516886204481125, -0.14113175868988037, -0.13057488203048706, -0.12001802027225494, -0.10946115106344223, -0.09890428185462952, -0.0883474200963974, -0.07779055088758469, -0.06723368167877197, -0.05667681246995926, -0.046119946986436844, -0.03556308150291443, -0.025006212294101715, -0.014449343085289001, -0.0038924813270568848, 0.006664387881755829, 0.017221257090568542, 0.027778124436736107, 0.03833499178290367, 0.048891857266426086, 0.0594487264752388, 0.07000559568405151, 0.08056245744228363, 0.09111932665109634, 0.10167619585990906, 0.11223306506872177, 0.12278993427753448, 0.1333467960357666, 0.1439036726951599, 0.15446053445339203, 0.16501739621162415, 0.17557427287101746, 0.18613113462924957, 0.1966879963874817, 0.207244873046875, 0.21780173480510712, 0.22835859656333923, 0.23891547322273254, 0.24947233498096466, 0.2600291967391968, 0.2705860733985901]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 6.0, 12.0, 20.0, 29.0, 31.0, 38.0, 55.0, 83.0, 135.0, 185.0, 241.0, 410.0, 653.0, 1197.0, 2318.0, 5208.0, 12665.0, 41014.0, 172592.0, 518985.0, 216075.0, 49822.0, 15000.0, 5689.0, 2563.0, 1362.0, 810.0, 449.0, 294.0, 198.0, 106.0, 85.0, 59.0, 40.0, 24.0, 22.0, 15.0, 8.0, 7.0, 9.0, 6.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3349609375, -0.3243522644042969, -0.31374359130859375, -0.3031349182128906, -0.2925262451171875, -0.2819175720214844, -0.27130889892578125, -0.2607002258300781, -0.250091552734375, -0.23948287963867188, -0.22887420654296875, -0.21826553344726562, -0.2076568603515625, -0.19704818725585938, -0.18643951416015625, -0.17583084106445312, -0.16522216796875, -0.15461349487304688, -0.14400482177734375, -0.13339614868164062, -0.1227874755859375, -0.11217880249023438, -0.10157012939453125, -0.09096145629882812, -0.080352783203125, -0.06974411010742188, -0.05913543701171875, -0.048526763916015625, -0.0379180908203125, -0.027309417724609375, -0.01670074462890625, -0.006092071533203125, 0.0045166015625, 0.015125274658203125, 0.02573394775390625, 0.036342620849609375, 0.0469512939453125, 0.057559967041015625, 0.06816864013671875, 0.07877731323242188, 0.089385986328125, 0.09999465942382812, 0.11060333251953125, 0.12121200561523438, 0.1318206787109375, 0.14242935180664062, 0.15303802490234375, 0.16364669799804688, 0.17425537109375, 0.18486404418945312, 0.19547271728515625, 0.20608139038085938, 0.2166900634765625, 0.22729873657226562, 0.23790740966796875, 0.24851608276367188, 0.259124755859375, 0.2697334289550781, 0.28034210205078125, 0.2909507751464844, 0.3015594482421875, 0.3121681213378906, 0.32277679443359375, 0.3333854675292969, 0.343994140625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 6.0, 20.0, 26.0, 40.0, 56.0, 67.0, 84.0, 105.0, 107.0, 113.0, 98.0, 76.0, 63.0, 42.0, 27.0, 19.0, 13.0, 4.0, 8.0, 1.0, 7.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10758399963378906, -0.10261917114257812, -0.09765434265136719, -0.09268951416015625, -0.08772468566894531, -0.08275985717773438, -0.07779502868652344, -0.0728302001953125, -0.06786537170410156, -0.06290054321289062, -0.05793571472167969, -0.05297088623046875, -0.04800605773925781, -0.043041229248046875, -0.03807640075683594, -0.033111572265625, -0.028146743774414062, -0.023181915283203125, -0.018217086791992188, -0.01325225830078125, -0.008287429809570312, -0.003322601318359375, 0.0016422271728515625, 0.0066070556640625, 0.011571884155273438, 0.016536712646484375, 0.021501541137695312, 0.02646636962890625, 0.03143119812011719, 0.036396026611328125, 0.04136085510253906, 0.04632568359375, 0.05129051208496094, 0.056255340576171875, 0.06122016906738281, 0.06618499755859375, 0.07114982604980469, 0.07611465454101562, 0.08107948303222656, 0.0860443115234375, 0.09100914001464844, 0.09597396850585938, 0.10093879699707031, 0.10590362548828125, 0.11086845397949219, 0.11583328247070312, 0.12079811096191406, 0.125762939453125, 0.13072776794433594, 0.13569259643554688, 0.1406574249267578, 0.14562225341796875, 0.1505870819091797, 0.15555191040039062, 0.16051673889160156, 0.1654815673828125, 0.17044639587402344, 0.17541122436523438, 0.1803760528564453, 0.18534088134765625, 0.1903057098388672, 0.19527053833007812, 0.20023536682128906, 0.2052001953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 10.0, 10.0, 18.0, 32.0, 30.0, 45.0, 65.0, 91.0, 156.0, 228.0, 413.0, 727.0, 1398.0, 2777.0, 6285.0, 14888.0, 39262.0, 121943.0, 351994.0, 334014.0, 112123.0, 36265.0, 13961.0, 5923.0, 2728.0, 1313.0, 723.0, 379.0, 245.0, 141.0, 102.0, 76.0, 46.0, 29.0, 31.0, 18.0, 19.0, 6.0, 8.0, 1.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.22998046875, -0.22320938110351562, -0.21643829345703125, -0.20966720581054688, -0.2028961181640625, -0.19612503051757812, -0.18935394287109375, -0.18258285522460938, -0.175811767578125, -0.16904067993164062, -0.16226959228515625, -0.15549850463867188, -0.1487274169921875, -0.14195632934570312, -0.13518524169921875, -0.12841415405273438, -0.12164306640625, -0.11487197875976562, -0.10810089111328125, -0.10132980346679688, -0.0945587158203125, -0.08778762817382812, -0.08101654052734375, -0.07424545288085938, -0.067474365234375, -0.060703277587890625, -0.05393218994140625, -0.047161102294921875, -0.0403900146484375, -0.033618927001953125, -0.02684783935546875, -0.020076751708984375, -0.0133056640625, -0.006534576416015625, 0.00023651123046875, 0.007007598876953125, 0.0137786865234375, 0.020549774169921875, 0.02732086181640625, 0.034091949462890625, 0.040863037109375, 0.047634124755859375, 0.05440521240234375, 0.061176300048828125, 0.0679473876953125, 0.07471847534179688, 0.08148956298828125, 0.08826065063476562, 0.09503173828125, 0.10180282592773438, 0.10857391357421875, 0.11534500122070312, 0.1221160888671875, 0.12888717651367188, 0.13565826416015625, 0.14242935180664062, 0.149200439453125, 0.15597152709960938, 0.16274261474609375, 0.16951370239257812, 0.1762847900390625, 0.18305587768554688, 0.18982696533203125, 0.19659805297851562, 0.203369140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 3.0, 10.0, 4.0, 8.0, 13.0, 11.0, 14.0, 18.0, 15.0, 15.0, 13.0, 27.0, 30.0, 28.0, 22.0, 33.0, 45.0, 39.0, 47.0, 41.0, 28.0, 46.0, 45.0, 32.0, 52.0, 44.0, 33.0, 33.0, 29.0, 37.0, 30.0, 22.0, 16.0, 17.0, 20.0, 18.0, 13.0, 5.0, 11.0, 6.0, 8.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.309326171875, -0.299713134765625, -0.29010009765625, -0.280487060546875, -0.2708740234375, -0.261260986328125, -0.25164794921875, -0.242034912109375, -0.232421875, -0.222808837890625, -0.21319580078125, -0.203582763671875, -0.1939697265625, -0.184356689453125, -0.17474365234375, -0.165130615234375, -0.155517578125, -0.145904541015625, -0.13629150390625, -0.126678466796875, -0.1170654296875, -0.107452392578125, -0.09783935546875, -0.088226318359375, -0.07861328125, -0.069000244140625, -0.05938720703125, -0.049774169921875, -0.0401611328125, -0.030548095703125, -0.02093505859375, -0.011322021484375, -0.001708984375, 0.007904052734375, 0.01751708984375, 0.027130126953125, 0.0367431640625, 0.046356201171875, 0.05596923828125, 0.065582275390625, 0.0751953125, 0.084808349609375, 0.09442138671875, 0.104034423828125, 0.1136474609375, 0.123260498046875, 0.13287353515625, 0.142486572265625, 0.152099609375, 0.161712646484375, 0.17132568359375, 0.180938720703125, 0.1905517578125, 0.200164794921875, 0.20977783203125, 0.219390869140625, 0.22900390625, 0.238616943359375, 0.24822998046875, 0.257843017578125, 0.2674560546875, 0.277069091796875, 0.28668212890625, 0.296295166015625, 0.305908203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 34.0, 50.0, 95.0, 341.0, 1261.0, 6627.0, 94544.0, 857582.0, 80151.0, 6155.0, 1165.0, 311.0, 116.0, 54.0, 29.0, 6.0, 11.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17714691162109375, -0.1704559326171875, -0.16376495361328125, -0.157073974609375, -0.15038299560546875, -0.1436920166015625, -0.13700103759765625, -0.13031005859375, -0.12361907958984375, -0.1169281005859375, -0.11023712158203125, -0.103546142578125, -0.09685516357421875, -0.0901641845703125, -0.08347320556640625, -0.0767822265625, -0.07009124755859375, -0.0634002685546875, -0.05670928955078125, -0.050018310546875, -0.04332733154296875, -0.0366363525390625, -0.02994537353515625, -0.02325439453125, -0.01656341552734375, -0.0098724365234375, -0.00318145751953125, 0.003509521484375, 0.01020050048828125, 0.0168914794921875, 0.02358245849609375, 0.0302734375, 0.03696441650390625, 0.0436553955078125, 0.05034637451171875, 0.057037353515625, 0.06372833251953125, 0.0704193115234375, 0.07711029052734375, 0.08380126953125, 0.09049224853515625, 0.0971832275390625, 0.10387420654296875, 0.110565185546875, 0.11725616455078125, 0.1239471435546875, 0.13063812255859375, 0.1373291015625, 0.14402008056640625, 0.1507110595703125, 0.15740203857421875, 0.164093017578125, 0.17078399658203125, 0.1774749755859375, 0.18416595458984375, 0.19085693359375, 0.19754791259765625, 0.2042388916015625, 0.21092987060546875, 0.217620849609375, 0.22431182861328125, 0.2310028076171875, 0.23769378662109375, 0.244384765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 7.0, 6.0, 15.0, 10.0, 14.0, 12.0, 24.0, 18.0, 25.0, 34.0, 35.0, 60.0, 56.0, 78.0, 93.0, 100.0, 70.0, 50.0, 57.0, 39.0, 33.0, 25.0, 19.0, 15.0, 13.0, 21.0, 8.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.969141006469727e-05, -7.726624608039856e-05, -7.484108209609985e-05, -7.241591811180115e-05, -6.999075412750244e-05, -6.756559014320374e-05, -6.514042615890503e-05, -6.271526217460632e-05, -6.029009819030762e-05, -5.786493420600891e-05, -5.5439770221710205e-05, -5.30146062374115e-05, -5.058944225311279e-05, -4.816427826881409e-05, -4.573911428451538e-05, -4.3313950300216675e-05, -4.088878631591797e-05, -3.846362233161926e-05, -3.603845834732056e-05, -3.361329436302185e-05, -3.1188130378723145e-05, -2.876296639442444e-05, -2.6337802410125732e-05, -2.3912638425827026e-05, -2.148747444152832e-05, -1.9062310457229614e-05, -1.6637146472930908e-05, -1.4211982488632202e-05, -1.1786818504333496e-05, -9.36165452003479e-06, -6.936490535736084e-06, -4.511326551437378e-06, -2.086162567138672e-06, 3.390014171600342e-07, 2.7641654014587402e-06, 5.189329385757446e-06, 7.614493370056152e-06, 1.0039657354354858e-05, 1.2464821338653564e-05, 1.488998532295227e-05, 1.7315149307250977e-05, 1.9740313291549683e-05, 2.216547727584839e-05, 2.4590641260147095e-05, 2.70158052444458e-05, 2.9440969228744507e-05, 3.186613321304321e-05, 3.429129719734192e-05, 3.6716461181640625e-05, 3.914162516593933e-05, 4.156678915023804e-05, 4.399195313453674e-05, 4.641711711883545e-05, 4.8842281103134155e-05, 5.126744508743286e-05, 5.369260907173157e-05, 5.6117773056030273e-05, 5.854293704032898e-05, 6.0968101024627686e-05, 6.339326500892639e-05, 6.58184289932251e-05, 6.82435929775238e-05, 7.066875696182251e-05, 7.309392094612122e-05, 7.551908493041992e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 9.0, 10.0, 13.0, 27.0, 46.0, 82.0, 122.0, 258.0, 517.0, 1359.0, 4766.0, 26534.0, 272837.0, 663107.0, 65724.0, 9391.0, 2250.0, 769.0, 338.0, 171.0, 70.0, 46.0, 38.0, 17.0, 19.0, 9.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16681861877441406, -0.16164016723632812, -0.1564617156982422, -0.15128326416015625, -0.1461048126220703, -0.14092636108398438, -0.13574790954589844, -0.1305694580078125, -0.12539100646972656, -0.12021255493164062, -0.11503410339355469, -0.10985565185546875, -0.10467720031738281, -0.09949874877929688, -0.09432029724121094, -0.089141845703125, -0.08396339416503906, -0.07878494262695312, -0.07360649108886719, -0.06842803955078125, -0.06324958801269531, -0.058071136474609375, -0.05289268493652344, -0.0477142333984375, -0.04253578186035156, -0.037357330322265625, -0.03217887878417969, -0.02700042724609375, -0.021821975708007812, -0.016643524169921875, -0.011465072631835938, -0.00628662109375, -0.0011081695556640625, 0.004070281982421875, 0.009248733520507812, 0.01442718505859375, 0.019605636596679688, 0.024784088134765625, 0.029962539672851562, 0.0351409912109375, 0.04031944274902344, 0.045497894287109375, 0.05067634582519531, 0.05585479736328125, 0.06103324890136719, 0.06621170043945312, 0.07139015197753906, 0.076568603515625, 0.08174705505371094, 0.08692550659179688, 0.09210395812988281, 0.09728240966796875, 0.10246086120605469, 0.10763931274414062, 0.11281776428222656, 0.1179962158203125, 0.12317466735839844, 0.12835311889648438, 0.1335315704345703, 0.13871002197265625, 0.1438884735107422, 0.14906692504882812, 0.15424537658691406, 0.159423828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 14.0, 22.0, 23.0, 34.0, 48.0, 61.0, 97.0, 93.0, 122.0, 130.0, 93.0, 65.0, 53.0, 38.0, 28.0, 16.0, 20.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0], "bins": [-0.209716796875, -0.2054119110107422, -0.20110702514648438, -0.19680213928222656, -0.19249725341796875, -0.18819236755371094, -0.18388748168945312, -0.1795825958251953, -0.1752777099609375, -0.1709728240966797, -0.16666793823242188, -0.16236305236816406, -0.15805816650390625, -0.15375328063964844, -0.14944839477539062, -0.1451435089111328, -0.140838623046875, -0.1365337371826172, -0.13222885131835938, -0.12792396545410156, -0.12361907958984375, -0.11931419372558594, -0.11500930786132812, -0.11070442199707031, -0.1063995361328125, -0.10209465026855469, -0.09778976440429688, -0.09348487854003906, -0.08917999267578125, -0.08487510681152344, -0.08057022094726562, -0.07626533508300781, -0.07196044921875, -0.06765556335449219, -0.06335067749023438, -0.05904579162597656, -0.05474090576171875, -0.05043601989746094, -0.046131134033203125, -0.04182624816894531, -0.0375213623046875, -0.03321647644042969, -0.028911590576171875, -0.024606704711914062, -0.02030181884765625, -0.015996932983398438, -0.011692047119140625, -0.0073871612548828125, -0.003082275390625, 0.0012226104736328125, 0.005527496337890625, 0.009832382202148438, 0.01413726806640625, 0.018442153930664062, 0.022747039794921875, 0.027051925659179688, 0.0313568115234375, 0.03566169738769531, 0.039966583251953125, 0.04427146911621094, 0.04857635498046875, 0.05288124084472656, 0.057186126708984375, 0.06149101257324219, 0.0657958984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 10.0, 19.0, 32.0, 44.0, 72.0, 117.0, 148.0, 148.0, 140.0, 95.0, 63.0, 43.0, 18.0, 15.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2023637294769287, -1.142227292060852, -1.082090973854065, -1.0219545364379883, -0.9618180990219116, -0.9016817212104797, -0.8415453433990479, -0.7814089059829712, -0.7212724685668945, -0.6611360907554626, -0.600999653339386, -0.5408632755279541, -0.48072683811187744, -0.42059046030044556, -0.3604540526866913, -0.300317645072937, -0.24018126726150513, -0.18004485964775085, -0.11990845948457718, -0.0597720593214035, 0.00036434829235076904, 0.06050074100494385, 0.12063714861869812, 0.1807735562324524, 0.24090996384620667, 0.30104637145996094, 0.3611827790737152, 0.4213191866874695, 0.48145556449890137, 0.541592001914978, 0.6017283797264099, 0.6618647575378418, 0.7220011949539185, 0.7821375727653503, 0.842274010181427, 0.9024103879928589, 0.9625468254089355, 1.0226831436157227, 1.0828195810317993, 1.142956018447876, 1.2030924558639526, 1.2632288932800293, 1.3233652114868164, 1.383501648902893, 1.4436380863189697, 1.5037744045257568, 1.5639108419418335, 1.6240472793579102, 1.6841835975646973, 1.744320034980774, 1.804456353187561, 1.8645927906036377, 1.9247292280197144, 1.984865665435791, 2.045001983642578, 2.1051383018493652, 2.1652748584747314, 2.2254111766815186, 2.2855477333068848, 2.345684051513672, 2.405820369720459, 2.465956926345825, 2.5260932445526123, 2.5862298011779785, 2.6463661193847656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 11.0, 10.0, 4.0, 7.0, 9.0, 19.0, 20.0, 22.0, 16.0, 25.0, 38.0, 34.0, 30.0, 49.0, 47.0, 32.0, 56.0, 45.0, 33.0, 40.0, 44.0, 39.0, 47.0, 39.0, 41.0, 26.0, 18.0, 35.0, 25.0, 20.0, 22.0, 13.0, 19.0, 7.0, 12.0, 7.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8370895385742188, -1.7772239446640015, -1.7173584699630737, -1.6574928760528564, -1.5976274013519287, -1.5377618074417114, -1.4778962135314941, -1.4180307388305664, -1.3581651449203491, -1.2982995510101318, -1.238434076309204, -1.1785684823989868, -1.118703007698059, -1.0588374137878418, -0.9989718794822693, -0.9391063451766968, -0.8792408108711243, -0.8193752765655518, -0.7595097422599792, -0.6996442079544067, -0.6397786140441895, -0.5799130797386169, -0.5200475454330444, -0.46018198132514954, -0.400316447019577, -0.3404509127140045, -0.2805853486061096, -0.2207198143005371, -0.1608542650938034, -0.1009887158870697, -0.04112318158149719, 0.018742382526397705, 0.07860791683197021, 0.13847346603870392, 0.19833901524543762, 0.25820454955101013, 0.31807011365890503, 0.37793564796447754, 0.43780118227005005, 0.49766674637794495, 0.5575323104858398, 0.6173978447914124, 0.6772633790969849, 0.7371289730072021, 0.7969945073127747, 0.8568600416183472, 0.9167255759239197, 0.9765911102294922, 1.03645658493042, 1.0963221788406372, 1.156187653541565, 1.2160532474517822, 1.27591872215271, 1.3357843160629272, 1.3956499099731445, 1.4555153846740723, 1.5153809785842896, 1.5752465724945068, 1.6351120471954346, 1.6949776411056519, 1.7548431158065796, 1.8147087097167969, 1.8745741844177246, 1.934439778327942, 1.9943053722381592]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 8.0, 11.0, 17.0, 27.0, 44.0, 91.0, 138.0, 226.0, 395.0, 775.0, 1529.0, 3807.0, 13403.0, 85896.0, 3851177.0, 206959.0, 20638.0, 5226.0, 1897.0, 853.0, 451.0, 248.0, 152.0, 84.0, 54.0, 51.0, 26.0, 28.0, 14.0, 12.0, 10.0, 7.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.313720703125, -0.3009910583496094, -0.28826141357421875, -0.2755317687988281, -0.2628021240234375, -0.2500724792480469, -0.23734283447265625, -0.22461318969726562, -0.211883544921875, -0.19915390014648438, -0.18642425537109375, -0.17369461059570312, -0.1609649658203125, -0.14823532104492188, -0.13550567626953125, -0.12277603149414062, -0.11004638671875, -0.09731674194335938, -0.08458709716796875, -0.07185745239257812, -0.0591278076171875, -0.046398162841796875, -0.03366851806640625, -0.020938873291015625, -0.008209228515625, 0.004520416259765625, 0.01725006103515625, 0.029979705810546875, 0.0427093505859375, 0.055438995361328125, 0.06816864013671875, 0.08089828491210938, 0.0936279296875, 0.10635757446289062, 0.11908721923828125, 0.13181686401367188, 0.1445465087890625, 0.15727615356445312, 0.17000579833984375, 0.18273544311523438, 0.195465087890625, 0.20819473266601562, 0.22092437744140625, 0.23365402221679688, 0.2463836669921875, 0.2591133117675781, 0.27184295654296875, 0.2845726013183594, 0.29730224609375, 0.3100318908691406, 0.32276153564453125, 0.3354911804199219, 0.3482208251953125, 0.3609504699707031, 0.37368011474609375, 0.3864097595214844, 0.399139404296875, 0.4118690490722656, 0.42459869384765625, 0.4373283386230469, 0.4500579833984375, 0.4627876281738281, 0.47551727294921875, 0.4882469177246094, 0.5009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 10.0, 20.0, 21.0, 43.0, 55.0, 65.0, 67.0, 92.0, 110.0, 110.0, 94.0, 75.0, 67.0, 43.0, 33.0, 26.0, 21.0, 9.0, 6.0, 4.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.119873046875, -0.11465072631835938, -0.10942840576171875, -0.10420608520507812, -0.0989837646484375, -0.09376144409179688, -0.08853912353515625, -0.08331680297851562, -0.078094482421875, -0.07287216186523438, -0.06764984130859375, -0.062427520751953125, -0.0572052001953125, -0.051982879638671875, -0.04676055908203125, -0.041538238525390625, -0.03631591796875, -0.031093597412109375, -0.02587127685546875, -0.020648956298828125, -0.0154266357421875, -0.010204315185546875, -0.00498199462890625, 0.000240325927734375, 0.005462646484375, 0.010684967041015625, 0.01590728759765625, 0.021129608154296875, 0.0263519287109375, 0.031574249267578125, 0.03679656982421875, 0.042018890380859375, 0.0472412109375, 0.052463531494140625, 0.05768585205078125, 0.06290817260742188, 0.0681304931640625, 0.07335281372070312, 0.07857513427734375, 0.08379745483398438, 0.089019775390625, 0.09424209594726562, 0.09946441650390625, 0.10468673706054688, 0.1099090576171875, 0.11513137817382812, 0.12035369873046875, 0.12557601928710938, 0.13079833984375, 0.13602066040039062, 0.14124298095703125, 0.14646530151367188, 0.1516876220703125, 0.15690994262695312, 0.16213226318359375, 0.16735458374023438, 0.172576904296875, 0.17779922485351562, 0.18302154541015625, 0.18824386596679688, 0.1934661865234375, 0.19868850708007812, 0.20391082763671875, 0.20913314819335938, 0.21435546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 11.0, 12.0, 19.0, 35.0, 67.0, 135.0, 242.0, 536.0, 1158.0, 2605.0, 6963.0, 31351.0, 397783.0, 3596363.0, 131971.0, 16923.0, 4658.0, 1768.0, 861.0, 409.0, 193.0, 109.0, 46.0, 28.0, 13.0, 14.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23974609375, -0.23157119750976562, -0.22339630126953125, -0.21522140502929688, -0.2070465087890625, -0.19887161254882812, -0.19069671630859375, -0.18252182006835938, -0.174346923828125, -0.16617202758789062, -0.15799713134765625, -0.14982223510742188, -0.1416473388671875, -0.13347244262695312, -0.12529754638671875, -0.11712265014648438, -0.10894775390625, -0.10077285766601562, -0.09259796142578125, -0.08442306518554688, -0.0762481689453125, -0.06807327270507812, -0.05989837646484375, -0.051723480224609375, -0.043548583984375, -0.035373687744140625, -0.02719879150390625, -0.019023895263671875, -0.0108489990234375, -0.002674102783203125, 0.00550079345703125, 0.013675689697265625, 0.0218505859375, 0.030025482177734375, 0.03820037841796875, 0.046375274658203125, 0.0545501708984375, 0.06272506713867188, 0.07089996337890625, 0.07907485961914062, 0.087249755859375, 0.09542465209960938, 0.10359954833984375, 0.11177444458007812, 0.1199493408203125, 0.12812423706054688, 0.13629913330078125, 0.14447402954101562, 0.15264892578125, 0.16082382202148438, 0.16899871826171875, 0.17717361450195312, 0.1853485107421875, 0.19352340698242188, 0.20169830322265625, 0.20987319946289062, 0.218048095703125, 0.22622299194335938, 0.23439788818359375, 0.24257278442382812, 0.2507476806640625, 0.2589225769042969, 0.26709747314453125, 0.2752723693847656, 0.283447265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 16.0, 12.0, 29.0, 38.0, 68.0, 165.0, 328.0, 1143.0, 1459.0, 396.0, 169.0, 98.0, 47.0, 24.0, 16.0, 13.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1126708984375, -0.10865974426269531, -0.10464859008789062, -0.10063743591308594, -0.09662628173828125, -0.09261512756347656, -0.08860397338867188, -0.08459281921386719, -0.0805816650390625, -0.07657051086425781, -0.07255935668945312, -0.06854820251464844, -0.06453704833984375, -0.06052589416503906, -0.056514739990234375, -0.05250358581542969, -0.048492431640625, -0.04448127746582031, -0.040470123291015625, -0.03645896911621094, -0.03244781494140625, -0.028436660766601562, -0.024425506591796875, -0.020414352416992188, -0.0164031982421875, -0.012392044067382812, -0.008380889892578125, -0.0043697357177734375, -0.00035858154296875, 0.0036525726318359375, 0.007663726806640625, 0.011674880981445312, 0.01568603515625, 0.019697189331054688, 0.023708343505859375, 0.027719497680664062, 0.03173065185546875, 0.03574180603027344, 0.039752960205078125, 0.04376411437988281, 0.0477752685546875, 0.05178642272949219, 0.055797576904296875, 0.05980873107910156, 0.06381988525390625, 0.06783103942871094, 0.07184219360351562, 0.07585334777832031, 0.079864501953125, 0.08387565612792969, 0.08788681030273438, 0.09189796447753906, 0.09590911865234375, 0.09992027282714844, 0.10393142700195312, 0.10794258117675781, 0.1119537353515625, 0.11596488952636719, 0.11997604370117188, 0.12398719787597656, 0.12799835205078125, 0.13200950622558594, 0.13602066040039062, 0.1400318145751953, 0.14404296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 15.0, 45.0, 51.0, 114.0, 171.0, 208.0, 172.0, 111.0, 60.0, 23.0, 14.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5676390528678894, -0.5452802777290344, -0.5229215025901794, -0.5005627274513245, -0.4782039523124695, -0.4558451771736145, -0.4334864318370819, -0.41112765669822693, -0.38876888155937195, -0.36641010642051697, -0.344051331281662, -0.3216925859451294, -0.2993338108062744, -0.27697503566741943, -0.25461626052856445, -0.23225748538970947, -0.2098987102508545, -0.1875399351119995, -0.16518115997314453, -0.14282239973545074, -0.12046362459659576, -0.09810484945774078, -0.075746089220047, -0.05338731408119202, -0.031028538942337036, -0.008669767528772354, 0.013689003884792328, 0.03604777157306671, 0.05840654671192169, 0.08076532185077667, 0.10312408208847046, 0.12548285722732544, 0.14784163236618042, 0.1702004075050354, 0.19255918264389038, 0.21491794288158417, 0.23727671802043915, 0.2596355080604553, 0.2819942533969879, 0.3043530285358429, 0.3267118036746979, 0.34907057881355286, 0.37142935395240784, 0.39378809928894043, 0.4161468744277954, 0.4385056495666504, 0.46086442470550537, 0.48322319984436035, 0.5055819749832153, 0.5279407501220703, 0.5502995252609253, 0.5726583003997803, 0.5950170755386353, 0.6173758506774902, 0.6397346258163452, 0.6620934009552002, 0.6844521760940552, 0.7068109512329102, 0.7291697263717651, 0.7515285015106201, 0.7738872766494751, 0.7962460517883301, 0.8186048269271851, 0.84096360206604, 0.8633223176002502]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 3.0, 6.0, 8.0, 15.0, 11.0, 5.0, 26.0, 20.0, 21.0, 34.0, 29.0, 43.0, 44.0, 47.0, 46.0, 44.0, 47.0, 45.0, 53.0, 51.0, 49.0, 44.0, 41.0, 31.0, 32.0, 41.0, 29.0, 23.0, 14.0, 15.0, 15.0, 12.0, 15.0, 10.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3764731287956238, -0.36572128534317017, -0.35496947169303894, -0.3442176282405853, -0.3334658145904541, -0.3227139711380005, -0.3119621276855469, -0.30121028423309326, -0.29045847058296204, -0.2797066271305084, -0.2689548134803772, -0.2582029700279236, -0.24745114147663116, -0.23669931292533875, -0.22594746947288513, -0.2151956409215927, -0.2044438123703003, -0.19369198381900787, -0.18294015526771545, -0.17218831181526184, -0.16143648326396942, -0.150684654712677, -0.1399328112602234, -0.12918098270893097, -0.11842915415763855, -0.10767732560634613, -0.09692548960447311, -0.0861736536026001, -0.07542182505130768, -0.06466999650001526, -0.05391816049814224, -0.043166324496269226, -0.03241449594497681, -0.02166266366839409, -0.01091083139181137, -0.00015899911522865295, 0.010592833161354065, 0.021344665437936783, 0.0320964977145195, 0.04284833371639252, 0.053600162267684937, 0.06435199081897736, 0.07510382682085037, 0.08585566282272339, 0.09660749137401581, 0.10735931992530823, 0.11811115592718124, 0.12886299192905426, 0.13961482048034668, 0.1503666490316391, 0.16111847758293152, 0.17187032103538513, 0.18262214958667755, 0.19337397813796997, 0.20412582159042358, 0.214877650141716, 0.22562947869300842, 0.23638130724430084, 0.24713313579559326, 0.2578849792480469, 0.2686368227005005, 0.2793886363506317, 0.2901404798030853, 0.30089229345321655, 0.31164413690567017]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 4.0, 11.0, 8.0, 20.0, 21.0, 40.0, 43.0, 77.0, 132.0, 215.0, 389.0, 777.0, 1677.0, 4070.0, 12923.0, 64732.0, 571501.0, 335737.0, 40771.0, 9369.0, 3205.0, 1306.0, 639.0, 345.0, 196.0, 110.0, 78.0, 51.0, 32.0, 22.0, 14.0, 10.0, 9.0, 11.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.421875, -0.40775299072265625, -0.3936309814453125, -0.37950897216796875, -0.365386962890625, -0.35126495361328125, -0.3371429443359375, -0.32302093505859375, -0.30889892578125, -0.29477691650390625, -0.2806549072265625, -0.26653289794921875, -0.252410888671875, -0.23828887939453125, -0.2241668701171875, -0.21004486083984375, -0.1959228515625, -0.18180084228515625, -0.1676788330078125, -0.15355682373046875, -0.139434814453125, -0.12531280517578125, -0.1111907958984375, -0.09706878662109375, -0.08294677734375, -0.06882476806640625, -0.0547027587890625, -0.04058074951171875, -0.026458740234375, -0.01233673095703125, 0.0017852783203125, 0.01590728759765625, 0.030029296875, 0.04415130615234375, 0.0582733154296875, 0.07239532470703125, 0.086517333984375, 0.10063934326171875, 0.1147613525390625, 0.12888336181640625, 0.14300537109375, 0.15712738037109375, 0.1712493896484375, 0.18537139892578125, 0.199493408203125, 0.21361541748046875, 0.2277374267578125, 0.24185943603515625, 0.2559814453125, 0.27010345458984375, 0.2842254638671875, 0.29834747314453125, 0.312469482421875, 0.32659149169921875, 0.3407135009765625, 0.35483551025390625, 0.36895751953125, 0.38307952880859375, 0.3972015380859375, 0.41132354736328125, 0.425445556640625, 0.43956756591796875, 0.4536895751953125, 0.46781158447265625, 0.48193359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 17.0, 11.0, 36.0, 57.0, 64.0, 67.0, 78.0, 99.0, 108.0, 98.0, 84.0, 70.0, 62.0, 33.0, 26.0, 21.0, 15.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12077522277832031, -0.11581802368164062, -0.11086082458496094, -0.10590362548828125, -0.10094642639160156, -0.09598922729492188, -0.09103202819824219, -0.0860748291015625, -0.08111763000488281, -0.07616043090820312, -0.07120323181152344, -0.06624603271484375, -0.06128883361816406, -0.056331634521484375, -0.05137443542480469, -0.046417236328125, -0.04146003723144531, -0.036502838134765625, -0.03154563903808594, -0.02658843994140625, -0.021631240844726562, -0.016674041748046875, -0.011716842651367188, -0.0067596435546875, -0.0018024444580078125, 0.003154754638671875, 0.008111953735351562, 0.01306915283203125, 0.018026351928710938, 0.022983551025390625, 0.027940750122070312, 0.03289794921875, 0.03785514831542969, 0.042812347412109375, 0.04776954650878906, 0.05272674560546875, 0.05768394470214844, 0.06264114379882812, 0.06759834289550781, 0.0725555419921875, 0.07751274108886719, 0.08246994018554688, 0.08742713928222656, 0.09238433837890625, 0.09734153747558594, 0.10229873657226562, 0.10725593566894531, 0.112213134765625, 0.11717033386230469, 0.12212753295898438, 0.12708473205566406, 0.13204193115234375, 0.13699913024902344, 0.14195632934570312, 0.1469135284423828, 0.1518707275390625, 0.1568279266357422, 0.16178512573242188, 0.16674232482910156, 0.17169952392578125, 0.17665672302246094, 0.18161392211914062, 0.1865711212158203, 0.1915283203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 3.0, 12.0, 5.0, 9.0, 17.0, 19.0, 43.0, 40.0, 53.0, 100.0, 106.0, 224.0, 348.0, 557.0, 1124.0, 2504.0, 6108.0, 17899.0, 67399.0, 316621.0, 484074.0, 109158.0, 27030.0, 8498.0, 3297.0, 1475.0, 681.0, 385.0, 237.0, 154.0, 100.0, 72.0, 53.0, 28.0, 27.0, 24.0, 22.0, 13.0, 9.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.264892578125, -0.2566566467285156, -0.24842071533203125, -0.24018478393554688, -0.2319488525390625, -0.22371292114257812, -0.21547698974609375, -0.20724105834960938, -0.199005126953125, -0.19076919555664062, -0.18253326416015625, -0.17429733276367188, -0.1660614013671875, -0.15782546997070312, -0.14958953857421875, -0.14135360717773438, -0.13311767578125, -0.12488174438476562, -0.11664581298828125, -0.10840988159179688, -0.1001739501953125, -0.09193801879882812, -0.08370208740234375, -0.07546615600585938, -0.067230224609375, -0.058994293212890625, -0.05075836181640625, -0.042522430419921875, -0.0342864990234375, -0.026050567626953125, -0.01781463623046875, -0.009578704833984375, -0.0013427734375, 0.006893157958984375, 0.01512908935546875, 0.023365020751953125, 0.0316009521484375, 0.039836883544921875, 0.04807281494140625, 0.056308746337890625, 0.064544677734375, 0.07278060913085938, 0.08101654052734375, 0.08925247192382812, 0.0974884033203125, 0.10572433471679688, 0.11396026611328125, 0.12219619750976562, 0.13043212890625, 0.13866806030273438, 0.14690399169921875, 0.15513992309570312, 0.1633758544921875, 0.17161178588867188, 0.17984771728515625, 0.18808364868164062, 0.196319580078125, 0.20455551147460938, 0.21279144287109375, 0.22102737426757812, 0.2292633056640625, 0.23749923706054688, 0.24573516845703125, 0.2539710998535156, 0.26220703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 7.0, 1.0, 4.0, 8.0, 9.0, 8.0, 15.0, 10.0, 20.0, 20.0, 16.0, 27.0, 38.0, 35.0, 40.0, 38.0, 43.0, 35.0, 46.0, 38.0, 45.0, 58.0, 42.0, 49.0, 39.0, 32.0, 27.0, 40.0, 30.0, 38.0, 22.0, 22.0, 10.0, 18.0, 10.0, 10.0, 11.0, 11.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.362548828125, -0.35205078125, -0.341552734375, -0.3310546875, -0.320556640625, -0.31005859375, -0.299560546875, -0.2890625, -0.278564453125, -0.26806640625, -0.257568359375, -0.2470703125, -0.236572265625, -0.22607421875, -0.215576171875, -0.205078125, -0.194580078125, -0.18408203125, -0.173583984375, -0.1630859375, -0.152587890625, -0.14208984375, -0.131591796875, -0.12109375, -0.110595703125, -0.10009765625, -0.089599609375, -0.0791015625, -0.068603515625, -0.05810546875, -0.047607421875, -0.037109375, -0.026611328125, -0.01611328125, -0.005615234375, 0.0048828125, 0.015380859375, 0.02587890625, 0.036376953125, 0.046875, 0.057373046875, 0.06787109375, 0.078369140625, 0.0888671875, 0.099365234375, 0.10986328125, 0.120361328125, 0.130859375, 0.141357421875, 0.15185546875, 0.162353515625, 0.1728515625, 0.183349609375, 0.19384765625, 0.204345703125, 0.21484375, 0.225341796875, 0.23583984375, 0.246337890625, 0.2568359375, 0.267333984375, 0.27783203125, 0.288330078125, 0.298828125, 0.309326171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 17.0, 22.0, 40.0, 74.0, 140.0, 265.0, 651.0, 2247.0, 13589.0, 143328.0, 815074.0, 63788.0, 6966.0, 1401.0, 456.0, 214.0, 110.0, 58.0, 34.0, 12.0, 13.0, 9.0, 9.0, 10.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.1410083770751953, -0.13650894165039062, -0.13200950622558594, -0.12751007080078125, -0.12301063537597656, -0.11851119995117188, -0.11401176452636719, -0.1095123291015625, -0.10501289367675781, -0.10051345825195312, -0.09601402282714844, -0.09151458740234375, -0.08701515197753906, -0.08251571655273438, -0.07801628112792969, -0.073516845703125, -0.06901741027832031, -0.06451797485351562, -0.06001853942871094, -0.05551910400390625, -0.05101966857910156, -0.046520233154296875, -0.04202079772949219, -0.0375213623046875, -0.03302192687988281, -0.028522491455078125, -0.024023056030273438, -0.01952362060546875, -0.015024185180664062, -0.010524749755859375, -0.0060253143310546875, -0.00152587890625, 0.0029735565185546875, 0.007472991943359375, 0.011972427368164062, 0.01647186279296875, 0.020971298217773438, 0.025470733642578125, 0.029970169067382812, 0.0344696044921875, 0.03896903991699219, 0.043468475341796875, 0.04796791076660156, 0.05246734619140625, 0.05696678161621094, 0.061466217041015625, 0.06596565246582031, 0.070465087890625, 0.07496452331542969, 0.07946395874023438, 0.08396339416503906, 0.08846282958984375, 0.09296226501464844, 0.09746170043945312, 0.10196113586425781, 0.1064605712890625, 0.11096000671386719, 0.11545944213867188, 0.11995887756347656, 0.12445831298828125, 0.12895774841308594, 0.13345718383789062, 0.1379566192626953, 0.1424560546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 5.0, 6.0, 7.0, 12.0, 15.0, 10.0, 12.0, 14.0, 23.0, 26.0, 33.0, 62.0, 74.0, 89.0, 112.0, 99.0, 112.0, 69.0, 39.0, 36.0, 37.0, 10.0, 22.0, 11.0, 7.0, 12.0, 10.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.807222962379456e-05, -6.545335054397583e-05, -6.28344714641571e-05, -6.021559238433838e-05, -5.759671330451965e-05, -5.497783422470093e-05, -5.23589551448822e-05, -4.9740076065063477e-05, -4.712119698524475e-05, -4.4502317905426025e-05, -4.18834388256073e-05, -3.9264559745788574e-05, -3.664568066596985e-05, -3.402680158615112e-05, -3.14079225063324e-05, -2.8789043426513672e-05, -2.6170164346694946e-05, -2.355128526687622e-05, -2.0932406187057495e-05, -1.831352710723877e-05, -1.5694648027420044e-05, -1.3075768947601318e-05, -1.0456889867782593e-05, -7.838010787963867e-06, -5.219131708145142e-06, -2.600252628326416e-06, 1.862645149230957e-08, 2.637505531311035e-06, 5.256384611129761e-06, 7.875263690948486e-06, 1.0494142770767212e-05, 1.3113021850585938e-05, 1.5731900930404663e-05, 1.835078001022339e-05, 2.0969659090042114e-05, 2.358853816986084e-05, 2.6207417249679565e-05, 2.882629632949829e-05, 3.1445175409317017e-05, 3.406405448913574e-05, 3.668293356895447e-05, 3.930181264877319e-05, 4.192069172859192e-05, 4.4539570808410645e-05, 4.715844988822937e-05, 4.9777328968048096e-05, 5.239620804786682e-05, 5.501508712768555e-05, 5.763396620750427e-05, 6.0252845287323e-05, 6.287172436714172e-05, 6.549060344696045e-05, 6.810948252677917e-05, 7.07283616065979e-05, 7.334724068641663e-05, 7.596611976623535e-05, 7.858499884605408e-05, 8.12038779258728e-05, 8.382275700569153e-05, 8.644163608551025e-05, 8.906051516532898e-05, 9.16793942451477e-05, 9.429827332496643e-05, 9.691715240478516e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 7.0, 8.0, 12.0, 23.0, 34.0, 47.0, 85.0, 142.0, 228.0, 373.0, 792.0, 2424.0, 12623.0, 89913.0, 781210.0, 137081.0, 18314.0, 3200.0, 955.0, 463.0, 223.0, 161.0, 78.0, 57.0, 32.0, 21.0, 13.0, 7.0, 8.0, 3.0, 4.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.11088275909423828, -0.10671424865722656, -0.10254573822021484, -0.09837722778320312, -0.0942087173461914, -0.09004020690917969, -0.08587169647216797, -0.08170318603515625, -0.07753467559814453, -0.07336616516113281, -0.0691976547241211, -0.06502914428710938, -0.060860633850097656, -0.05669212341308594, -0.05252361297607422, -0.0483551025390625, -0.04418659210205078, -0.04001808166503906, -0.035849571228027344, -0.031681060791015625, -0.027512550354003906, -0.023344039916992188, -0.01917552947998047, -0.01500701904296875, -0.010838508605957031, -0.0066699981689453125, -0.0025014877319335938, 0.001667022705078125, 0.005835533142089844, 0.010004043579101562, 0.014172554016113281, 0.018341064453125, 0.02250957489013672, 0.026678085327148438, 0.030846595764160156, 0.035015106201171875, 0.039183616638183594, 0.04335212707519531, 0.04752063751220703, 0.05168914794921875, 0.05585765838623047, 0.06002616882324219, 0.0641946792602539, 0.06836318969726562, 0.07253170013427734, 0.07670021057128906, 0.08086872100830078, 0.0850372314453125, 0.08920574188232422, 0.09337425231933594, 0.09754276275634766, 0.10171127319335938, 0.1058797836303711, 0.11004829406738281, 0.11421680450439453, 0.11838531494140625, 0.12255382537841797, 0.1267223358154297, 0.1308908462524414, 0.13505935668945312, 0.13922786712646484, 0.14339637756347656, 0.14756488800048828, 0.1517333984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 13.0, 14.0, 11.0, 19.0, 28.0, 37.0, 33.0, 59.0, 75.0, 122.0, 167.0, 148.0, 84.0, 48.0, 41.0, 32.0, 24.0, 17.0, 4.0, 10.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1395263671875, -0.1362628936767578, -0.13299942016601562, -0.12973594665527344, -0.12647247314453125, -0.12320899963378906, -0.11994552612304688, -0.11668205261230469, -0.1134185791015625, -0.11015510559082031, -0.10689163208007812, -0.10362815856933594, -0.10036468505859375, -0.09710121154785156, -0.09383773803710938, -0.09057426452636719, -0.087310791015625, -0.08404731750488281, -0.08078384399414062, -0.07752037048339844, -0.07425689697265625, -0.07099342346191406, -0.06772994995117188, -0.06446647644042969, -0.0612030029296875, -0.05793952941894531, -0.054676055908203125, -0.05141258239746094, -0.04814910888671875, -0.04488563537597656, -0.041622161865234375, -0.03835868835449219, -0.03509521484375, -0.03183174133300781, -0.028568267822265625, -0.025304794311523438, -0.02204132080078125, -0.018777847290039062, -0.015514373779296875, -0.012250900268554688, -0.0089874267578125, -0.0057239532470703125, -0.002460479736328125, 0.0008029937744140625, 0.00406646728515625, 0.0073299407958984375, 0.010593414306640625, 0.013856887817382812, 0.017120361328125, 0.020383834838867188, 0.023647308349609375, 0.026910781860351562, 0.03017425537109375, 0.03343772888183594, 0.036701202392578125, 0.03996467590332031, 0.0432281494140625, 0.04649162292480469, 0.049755096435546875, 0.05301856994628906, 0.05628204345703125, 0.05954551696777344, 0.06280899047851562, 0.06607246398925781, 0.0693359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 44.0, 143.0, 369.0, 310.0, 99.0, 21.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6809935569763184, -3.5433645248413086, -3.405735731124878, -3.2681069374084473, -3.1304779052734375, -2.9928488731384277, -2.855220079421997, -2.7175912857055664, -2.5799622535705566, -2.442333221435547, -2.304704427719116, -2.1670756340026855, -2.029446601867676, -1.8918176889419556, -1.7541887760162354, -1.6165598630905151, -1.478930950164795, -1.3413020372390747, -1.2036731243133545, -1.0660442113876343, -0.9284152984619141, -0.7907863855361938, -0.6531574726104736, -0.5155285596847534, -0.3778996467590332, -0.240270733833313, -0.10264182090759277, 0.03498709201812744, 0.17261600494384766, 0.31024491786956787, 0.4478738307952881, 0.5855027437210083, 0.7231311798095703, 0.8607600927352905, 0.9983890056610107, 1.136017918586731, 1.2736468315124512, 1.4112757444381714, 1.5489046573638916, 1.6865335702896118, 1.824162483215332, 1.9617913961410522, 2.0994203090667725, 2.237049102783203, 2.374678134918213, 2.5123071670532227, 2.6499359607696533, 2.787564754486084, 2.9251937866210938, 3.0628228187561035, 3.200451612472534, 3.338080406188965, 3.4757094383239746, 3.6133384704589844, 3.750967264175415, 3.8885960578918457, 4.0262250900268555, 4.163854122161865, 4.301483154296875, 4.439111709594727, 4.576740741729736, 4.714369773864746, 4.851998329162598, 4.989627361297607, 5.127256393432617]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 0.0, 8.0, 10.0, 14.0, 15.0, 8.0, 16.0, 14.0, 17.0, 18.0, 26.0, 34.0, 28.0, 29.0, 33.0, 39.0, 41.0, 29.0, 46.0, 47.0, 33.0, 32.0, 53.0, 36.0, 43.0, 39.0, 38.0, 27.0, 33.0, 26.0, 23.0, 17.0, 28.0, 19.0, 17.0, 12.0, 11.0, 7.0, 4.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3635234832763672, -1.3164212703704834, -1.26931893825531, -1.2222166061401367, -1.175114393234253, -1.1280121803283691, -1.0809098482131958, -1.0338075160980225, -0.9867053031921387, -0.9396030306816101, -0.8925007581710815, -0.845398485660553, -0.7982962131500244, -0.7511939406394958, -0.7040916681289673, -0.6569893956184387, -0.6098871231079102, -0.5627848505973816, -0.515682578086853, -0.46858030557632446, -0.4214780330657959, -0.37437576055526733, -0.32727348804473877, -0.2801712155342102, -0.23306894302368164, -0.18596667051315308, -0.1388643980026245, -0.09176212549209595, -0.04465985298156738, 0.0024424195289611816, 0.049544692039489746, 0.09664696455001831, 0.14374923706054688, 0.19085150957107544, 0.237953782081604, 0.28505605459213257, 0.33215832710266113, 0.3792605996131897, 0.42636287212371826, 0.4734651446342468, 0.5205674171447754, 0.567669689655304, 0.6147719621658325, 0.6618742346763611, 0.7089765071868896, 0.7560787796974182, 0.8031810522079468, 0.8502833247184753, 0.8973855972290039, 0.9444878697395325, 0.991590142250061, 1.0386924743652344, 1.0857946872711182, 1.132896900177002, 1.1799992322921753, 1.2271015644073486, 1.2742037773132324, 1.3213059902191162, 1.3684083223342896, 1.415510654449463, 1.4626128673553467, 1.5097150802612305, 1.5568174123764038, 1.6039197444915771, 1.651021957397461]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 9.0, 11.0, 18.0, 15.0, 24.0, 37.0, 64.0, 100.0, 146.0, 211.0, 372.0, 668.0, 1313.0, 2902.0, 7368.0, 28182.0, 323720.0, 3737338.0, 70011.0, 13447.0, 4446.0, 1812.0, 869.0, 475.0, 247.0, 132.0, 99.0, 73.0, 41.0, 24.0, 22.0, 18.0, 7.0, 20.0, 6.0, 4.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.315673828125, -0.30449676513671875, -0.2933197021484375, -0.28214263916015625, -0.270965576171875, -0.25978851318359375, -0.2486114501953125, -0.23743438720703125, -0.22625732421875, -0.21508026123046875, -0.2039031982421875, -0.19272613525390625, -0.181549072265625, -0.17037200927734375, -0.1591949462890625, -0.14801788330078125, -0.1368408203125, -0.12566375732421875, -0.1144866943359375, -0.10330963134765625, -0.092132568359375, -0.08095550537109375, -0.0697784423828125, -0.05860137939453125, -0.04742431640625, -0.03624725341796875, -0.0250701904296875, -0.01389312744140625, -0.002716064453125, 0.00846099853515625, 0.0196380615234375, 0.03081512451171875, 0.0419921875, 0.05316925048828125, 0.0643463134765625, 0.07552337646484375, 0.086700439453125, 0.09787750244140625, 0.1090545654296875, 0.12023162841796875, 0.13140869140625, 0.14258575439453125, 0.1537628173828125, 0.16493988037109375, 0.176116943359375, 0.18729400634765625, 0.1984710693359375, 0.20964813232421875, 0.2208251953125, 0.23200225830078125, 0.2431793212890625, 0.25435638427734375, 0.265533447265625, 0.27671051025390625, 0.2878875732421875, 0.29906463623046875, 0.31024169921875, 0.32141876220703125, 0.3325958251953125, 0.34377288818359375, 0.354949951171875, 0.36612701416015625, 0.3773040771484375, 0.38848114013671875, 0.399658203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 2.0, 13.0, 8.0, 15.0, 32.0, 41.0, 64.0, 74.0, 102.0, 81.0, 127.0, 99.0, 88.0, 76.0, 50.0, 37.0, 29.0, 23.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1435546875, -0.1379108428955078, -0.13226699829101562, -0.12662315368652344, -0.12097930908203125, -0.11533546447753906, -0.10969161987304688, -0.10404777526855469, -0.0984039306640625, -0.09276008605957031, -0.08711624145507812, -0.08147239685058594, -0.07582855224609375, -0.07018470764160156, -0.06454086303710938, -0.05889701843261719, -0.053253173828125, -0.04760932922363281, -0.041965484619140625, -0.03632164001464844, -0.03067779541015625, -0.025033950805664062, -0.019390106201171875, -0.013746261596679688, -0.0081024169921875, -0.0024585723876953125, 0.003185272216796875, 0.008829116821289062, 0.01447296142578125, 0.020116806030273438, 0.025760650634765625, 0.03140449523925781, 0.03704833984375, 0.04269218444824219, 0.048336029052734375, 0.05397987365722656, 0.05962371826171875, 0.06526756286621094, 0.07091140747070312, 0.07655525207519531, 0.0821990966796875, 0.08784294128417969, 0.09348678588867188, 0.09913063049316406, 0.10477447509765625, 0.11041831970214844, 0.11606216430664062, 0.12170600891113281, 0.127349853515625, 0.1329936981201172, 0.13863754272460938, 0.14428138732910156, 0.14992523193359375, 0.15556907653808594, 0.16121292114257812, 0.1668567657470703, 0.1725006103515625, 0.1781444549560547, 0.18378829956054688, 0.18943214416503906, 0.19507598876953125, 0.20071983337402344, 0.20636367797851562, 0.2120075225830078, 0.2176513671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 12.0, 13.0, 23.0, 46.0, 77.0, 77.0, 129.0, 209.0, 353.0, 524.0, 928.0, 1604.0, 3030.0, 6791.0, 19666.0, 88169.0, 2359282.0, 1602550.0, 79159.0, 18520.0, 6589.0, 2831.0, 1477.0, 839.0, 491.0, 311.0, 205.0, 141.0, 81.0, 49.0, 29.0, 22.0, 20.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.2249469757080078, -0.21869277954101562, -0.21243858337402344, -0.20618438720703125, -0.19993019104003906, -0.19367599487304688, -0.1874217987060547, -0.1811676025390625, -0.1749134063720703, -0.16865921020507812, -0.16240501403808594, -0.15615081787109375, -0.14989662170410156, -0.14364242553710938, -0.1373882293701172, -0.131134033203125, -0.12487983703613281, -0.11862564086914062, -0.11237144470214844, -0.10611724853515625, -0.09986305236816406, -0.09360885620117188, -0.08735466003417969, -0.0811004638671875, -0.07484626770019531, -0.06859207153320312, -0.06233787536621094, -0.05608367919921875, -0.04982948303222656, -0.043575286865234375, -0.03732109069824219, -0.03106689453125, -0.024812698364257812, -0.018558502197265625, -0.012304306030273438, -0.00605010986328125, 0.0002040863037109375, 0.006458282470703125, 0.012712478637695312, 0.0189666748046875, 0.025220870971679688, 0.031475067138671875, 0.03772926330566406, 0.04398345947265625, 0.05023765563964844, 0.056491851806640625, 0.06274604797363281, 0.069000244140625, 0.07525444030761719, 0.08150863647460938, 0.08776283264160156, 0.09401702880859375, 0.10027122497558594, 0.10652542114257812, 0.11277961730957031, 0.1190338134765625, 0.1252880096435547, 0.13154220581054688, 0.13779640197753906, 0.14405059814453125, 0.15030479431152344, 0.15655899047851562, 0.1628131866455078, 0.1690673828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 6.0, 1.0, 6.0, 3.0, 10.0, 12.0, 20.0, 25.0, 52.0, 86.0, 249.0, 711.0, 1926.0, 551.0, 184.0, 82.0, 43.0, 33.0, 21.0, 13.0, 7.0, 13.0, 4.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11767578125, -0.11425304412841797, -0.11083030700683594, -0.1074075698852539, -0.10398483276367188, -0.10056209564208984, -0.09713935852050781, -0.09371662139892578, -0.09029388427734375, -0.08687114715576172, -0.08344841003417969, -0.08002567291259766, -0.07660293579101562, -0.0731801986694336, -0.06975746154785156, -0.06633472442626953, -0.0629119873046875, -0.05948925018310547, -0.05606651306152344, -0.052643775939941406, -0.049221038818359375, -0.045798301696777344, -0.04237556457519531, -0.03895282745361328, -0.03553009033203125, -0.03210735321044922, -0.028684616088867188, -0.025261878967285156, -0.021839141845703125, -0.018416404724121094, -0.014993667602539062, -0.011570930480957031, -0.008148193359375, -0.004725456237792969, -0.0013027191162109375, 0.0021200180053710938, 0.005542755126953125, 0.008965492248535156, 0.012388229370117188, 0.01581096649169922, 0.01923370361328125, 0.02265644073486328, 0.026079177856445312, 0.029501914978027344, 0.032924652099609375, 0.036347389221191406, 0.03977012634277344, 0.04319286346435547, 0.0466156005859375, 0.05003833770751953, 0.05346107482910156, 0.056883811950683594, 0.060306549072265625, 0.06372928619384766, 0.06715202331542969, 0.07057476043701172, 0.07399749755859375, 0.07742023468017578, 0.08084297180175781, 0.08426570892333984, 0.08768844604492188, 0.0911111831665039, 0.09453392028808594, 0.09795665740966797, 0.10137939453125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 17.0, 37.0, 100.0, 155.0, 193.0, 189.0, 142.0, 78.0, 29.0, 19.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8660962581634521, -0.8459039330482483, -0.8257116079330444, -0.8055192828178406, -0.7853269577026367, -0.7651346325874329, -0.744942307472229, -0.7247500419616699, -0.7045576572418213, -0.6843653321266174, -0.6641730070114136, -0.6439806818962097, -0.6237883567810059, -0.603596031665802, -0.5834037065505981, -0.5632114410400391, -0.5430191159248352, -0.5228267908096313, -0.5026344656944275, -0.48244214057922363, -0.4622498154640198, -0.4420574903488159, -0.42186519503593445, -0.4016728699207306, -0.38148054480552673, -0.3612882196903229, -0.341095894575119, -0.32090356945991516, -0.3007112741470337, -0.28051894903182983, -0.260326623916626, -0.24013429880142212, -0.21994197368621826, -0.1997496485710144, -0.17955732345581055, -0.15936501324176788, -0.13917268812656403, -0.11898036301136017, -0.09878804534673691, -0.07859572768211365, -0.05840340256690979, -0.03821108117699623, -0.018018759787082672, 0.002173561602830887, 0.022365882992744446, 0.0425582081079483, 0.06275052577257156, 0.08294284343719482, 0.10313516855239868, 0.12332749366760254, 0.1435198187828064, 0.16371212899684906, 0.18390445411205292, 0.20409677922725677, 0.22428908944129944, 0.2444814145565033, 0.26467373967170715, 0.284866064786911, 0.30505838990211487, 0.3252507150173187, 0.3454430103302002, 0.36563533544540405, 0.3858276605606079, 0.40601998567581177, 0.4262123107910156]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 19.0, 17.0, 20.0, 19.0, 38.0, 33.0, 32.0, 34.0, 34.0, 46.0, 34.0, 54.0, 49.0, 56.0, 55.0, 44.0, 45.0, 41.0, 47.0, 40.0, 31.0, 24.0, 32.0, 26.0, 17.0, 26.0, 16.0, 9.0, 12.0, 5.0, 6.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36335307359695435, -0.3531562387943268, -0.3429594039916992, -0.33276256918907166, -0.3225657343864441, -0.3123689293861389, -0.30217209458351135, -0.2919752597808838, -0.2817784249782562, -0.27158159017562866, -0.2613847553730011, -0.25118792057037354, -0.24099110066890717, -0.2307942658662796, -0.22059744596481323, -0.21040061116218567, -0.2002037763595581, -0.19000694155693054, -0.17981010675430298, -0.1696132868528366, -0.15941645205020905, -0.14921961724758148, -0.1390227973461151, -0.12882596254348755, -0.11862912774085999, -0.10843229293823242, -0.09823546558618546, -0.08803863823413849, -0.07784180343151093, -0.06764496862888336, -0.057448141276836395, -0.04725131392478943, -0.037054479122161865, -0.0268576480448246, -0.016660816967487335, -0.00646398589015007, 0.003732845187187195, 0.01392967626452446, 0.024126507341861725, 0.03432333469390869, 0.044520169496536255, 0.05471700057387352, 0.06491383165121078, 0.07511065900325775, 0.08530749380588531, 0.09550432860851288, 0.10570115596055984, 0.11589798331260681, 0.12609481811523438, 0.13629165291786194, 0.1464884877204895, 0.15668530762195587, 0.16688214242458344, 0.177078977227211, 0.18727579712867737, 0.19747263193130493, 0.2076694667339325, 0.21786630153656006, 0.22806313633918762, 0.238259956240654, 0.24845679104328156, 0.2586536109447479, 0.2688504457473755, 0.27904728055000305, 0.2892441153526306]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 9.0, 3.0, 13.0, 19.0, 45.0, 95.0, 171.0, 323.0, 746.0, 2142.0, 9894.0, 111795.0, 828640.0, 83116.0, 8316.0, 1941.0, 643.0, 301.0, 156.0, 80.0, 41.0, 15.0, 14.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5455551147460938, -0.5256805419921875, -0.5058059692382812, -0.485931396484375, -0.46605682373046875, -0.4461822509765625, -0.42630767822265625, -0.40643310546875, -0.38655853271484375, -0.3666839599609375, -0.34680938720703125, -0.326934814453125, -0.30706024169921875, -0.2871856689453125, -0.26731109619140625, -0.2474365234375, -0.22756195068359375, -0.2076873779296875, -0.18781280517578125, -0.167938232421875, -0.14806365966796875, -0.1281890869140625, -0.10831451416015625, -0.08843994140625, -0.06856536865234375, -0.0486907958984375, -0.02881622314453125, -0.008941650390625, 0.01093292236328125, 0.0308074951171875, 0.05068206787109375, 0.070556640625, 0.09043121337890625, 0.1103057861328125, 0.13018035888671875, 0.150054931640625, 0.16992950439453125, 0.1898040771484375, 0.20967864990234375, 0.22955322265625, 0.24942779541015625, 0.2693023681640625, 0.28917694091796875, 0.309051513671875, 0.32892608642578125, 0.3488006591796875, 0.36867523193359375, 0.3885498046875, 0.40842437744140625, 0.4282989501953125, 0.44817352294921875, 0.468048095703125, 0.48792266845703125, 0.5077972412109375, 0.5276718139648438, 0.54754638671875, 0.5674209594726562, 0.5872955322265625, 0.6071701049804688, 0.627044677734375, 0.6469192504882812, 0.6667938232421875, 0.6866683959960938, 0.70654296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 11.0, 15.0, 18.0, 33.0, 37.0, 76.0, 78.0, 107.0, 85.0, 126.0, 111.0, 65.0, 75.0, 50.0, 36.0, 19.0, 20.0, 9.0, 9.0, 6.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1466064453125, -0.14100074768066406, -0.13539505004882812, -0.1297893524169922, -0.12418365478515625, -0.11857795715332031, -0.11297225952148438, -0.10736656188964844, -0.1017608642578125, -0.09615516662597656, -0.09054946899414062, -0.08494377136230469, -0.07933807373046875, -0.07373237609863281, -0.06812667846679688, -0.06252098083496094, -0.056915283203125, -0.05130958557128906, -0.045703887939453125, -0.04009819030761719, -0.03449249267578125, -0.028886795043945312, -0.023281097412109375, -0.017675399780273438, -0.0120697021484375, -0.0064640045166015625, -0.000858306884765625, 0.0047473907470703125, 0.01035308837890625, 0.015958786010742188, 0.021564483642578125, 0.027170181274414062, 0.03277587890625, 0.03838157653808594, 0.043987274169921875, 0.04959297180175781, 0.05519866943359375, 0.06080436706542969, 0.06641006469726562, 0.07201576232910156, 0.0776214599609375, 0.08322715759277344, 0.08883285522460938, 0.09443855285644531, 0.10004425048828125, 0.10564994812011719, 0.11125564575195312, 0.11686134338378906, 0.122467041015625, 0.12807273864746094, 0.13367843627929688, 0.1392841339111328, 0.14488983154296875, 0.1504955291748047, 0.15610122680664062, 0.16170692443847656, 0.1673126220703125, 0.17291831970214844, 0.17852401733398438, 0.1841297149658203, 0.18973541259765625, 0.1953411102294922, 0.20094680786132812, 0.20655250549316406, 0.212158203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 8.0, 9.0, 15.0, 28.0, 43.0, 46.0, 94.0, 134.0, 246.0, 456.0, 902.0, 2213.0, 7237.0, 29225.0, 170920.0, 646858.0, 152599.0, 26714.0, 6617.0, 2252.0, 868.0, 461.0, 270.0, 125.0, 66.0, 40.0, 43.0, 21.0, 13.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.251678466796875, -0.24139404296875, -0.231109619140625, -0.2208251953125, -0.210540771484375, -0.20025634765625, -0.189971923828125, -0.1796875, -0.169403076171875, -0.15911865234375, -0.148834228515625, -0.1385498046875, -0.128265380859375, -0.11798095703125, -0.107696533203125, -0.097412109375, -0.087127685546875, -0.07684326171875, -0.066558837890625, -0.0562744140625, -0.045989990234375, -0.03570556640625, -0.025421142578125, -0.01513671875, -0.004852294921875, 0.00543212890625, 0.015716552734375, 0.0260009765625, 0.036285400390625, 0.04656982421875, 0.056854248046875, 0.067138671875, 0.077423095703125, 0.08770751953125, 0.097991943359375, 0.1082763671875, 0.118560791015625, 0.12884521484375, 0.139129638671875, 0.1494140625, 0.159698486328125, 0.16998291015625, 0.180267333984375, 0.1905517578125, 0.200836181640625, 0.21112060546875, 0.221405029296875, 0.231689453125, 0.241973876953125, 0.25225830078125, 0.262542724609375, 0.2728271484375, 0.283111572265625, 0.29339599609375, 0.303680419921875, 0.31396484375, 0.324249267578125, 0.33453369140625, 0.344818115234375, 0.3551025390625, 0.365386962890625, 0.37567138671875, 0.385955810546875, 0.396240234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 9.0, 8.0, 17.0, 17.0, 23.0, 27.0, 42.0, 49.0, 50.0, 59.0, 65.0, 57.0, 73.0, 86.0, 59.0, 70.0, 50.0, 49.0, 48.0, 39.0, 26.0, 17.0, 17.0, 11.0, 7.0, 6.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4060401916503906, -0.39044952392578125, -0.3748588562011719, -0.3592681884765625, -0.3436775207519531, -0.32808685302734375, -0.3124961853027344, -0.296905517578125, -0.2813148498535156, -0.26572418212890625, -0.2501335144042969, -0.2345428466796875, -0.21895217895507812, -0.20336151123046875, -0.18777084350585938, -0.17218017578125, -0.15658950805664062, -0.14099884033203125, -0.12540817260742188, -0.1098175048828125, -0.09422683715820312, -0.07863616943359375, -0.06304550170898438, -0.047454833984375, -0.031864166259765625, -0.01627349853515625, -0.000682830810546875, 0.0149078369140625, 0.030498504638671875, 0.04608917236328125, 0.061679840087890625, 0.0772705078125, 0.09286117553710938, 0.10845184326171875, 0.12404251098632812, 0.1396331787109375, 0.15522384643554688, 0.17081451416015625, 0.18640518188476562, 0.201995849609375, 0.21758651733398438, 0.23317718505859375, 0.24876785278320312, 0.2643585205078125, 0.2799491882324219, 0.29553985595703125, 0.3111305236816406, 0.32672119140625, 0.3423118591308594, 0.35790252685546875, 0.3734931945800781, 0.3890838623046875, 0.4046745300292969, 0.42026519775390625, 0.4358558654785156, 0.451446533203125, 0.4670372009277344, 0.48262786865234375, 0.4982185363769531, 0.5138092041015625, 0.5293998718261719, 0.5449905395507812, 0.5605812072753906, 0.576171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 18.0, 46.0, 79.0, 206.0, 395.0, 1094.0, 3888.0, 19345.0, 141634.0, 783081.0, 81574.0, 12900.0, 2797.0, 782.0, 342.0, 163.0, 93.0, 40.0, 18.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.08997344970703125, -0.0865631103515625, -0.08315277099609375, -0.079742431640625, -0.07633209228515625, -0.0729217529296875, -0.06951141357421875, -0.06610107421875, -0.06269073486328125, -0.0592803955078125, -0.05587005615234375, -0.052459716796875, -0.04904937744140625, -0.0456390380859375, -0.04222869873046875, -0.038818359375, -0.03540802001953125, -0.0319976806640625, -0.02858734130859375, -0.025177001953125, -0.02176666259765625, -0.0183563232421875, -0.01494598388671875, -0.01153564453125, -0.00812530517578125, -0.0047149658203125, -0.00130462646484375, 0.002105712890625, 0.00551605224609375, 0.0089263916015625, 0.01233673095703125, 0.0157470703125, 0.01915740966796875, 0.0225677490234375, 0.02597808837890625, 0.029388427734375, 0.03279876708984375, 0.0362091064453125, 0.03961944580078125, 0.04302978515625, 0.04644012451171875, 0.0498504638671875, 0.05326080322265625, 0.056671142578125, 0.06008148193359375, 0.0634918212890625, 0.06690216064453125, 0.0703125, 0.07372283935546875, 0.0771331787109375, 0.08054351806640625, 0.083953857421875, 0.08736419677734375, 0.0907745361328125, 0.09418487548828125, 0.09759521484375, 0.10100555419921875, 0.1044158935546875, 0.10782623291015625, 0.111236572265625, 0.11464691162109375, 0.1180572509765625, 0.12146759033203125, 0.1248779296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 5.0, 7.0, 7.0, 18.0, 25.0, 31.0, 44.0, 85.0, 146.0, 159.0, 160.0, 116.0, 65.0, 52.0, 27.0, 21.0, 15.0, 11.0, 6.0, 3.0, 0.0, 2.0], "bins": [-0.00022041797637939453, -0.00021615158766508102, -0.00021188519895076752, -0.000207618810236454, -0.0002033524215221405, -0.000199086032807827, -0.0001948196440935135, -0.00019055325537919998, -0.00018628686666488647, -0.00018202047795057297, -0.00017775408923625946, -0.00017348770052194595, -0.00016922131180763245, -0.00016495492309331894, -0.00016068853437900543, -0.00015642214566469193, -0.00015215575695037842, -0.0001478893682360649, -0.0001436229795217514, -0.0001393565908074379, -0.0001350902020931244, -0.00013082381337881088, -0.00012655742466449738, -0.00012229103595018387, -0.00011802464723587036, -0.00011375825852155685, -0.00010949186980724335, -0.00010522548109292984, -0.00010095909237861633, -9.669270366430283e-05, -9.242631494998932e-05, -8.815992623567581e-05, -8.38935375213623e-05, -7.96271488070488e-05, -7.536076009273529e-05, -7.109437137842178e-05, -6.682798266410828e-05, -6.256159394979477e-05, -5.829520523548126e-05, -5.4028816521167755e-05, -4.976242780685425e-05, -4.549603909254074e-05, -4.1229650378227234e-05, -3.696326166391373e-05, -3.269687294960022e-05, -2.8430484235286713e-05, -2.4164095520973206e-05, -1.98977068066597e-05, -1.563131809234619e-05, -1.1364929378032684e-05, -7.098540663719177e-06, -2.83215194940567e-06, 1.434236764907837e-06, 5.700625479221344e-06, 9.967014193534851e-06, 1.4233402907848358e-05, 1.8499791622161865e-05, 2.2766180336475372e-05, 2.703256905078888e-05, 3.1298957765102386e-05, 3.5565346479415894e-05, 3.98317351937294e-05, 4.409812390804291e-05, 4.8364512622356415e-05, 5.263090133666992e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 7.0, 15.0, 29.0, 40.0, 37.0, 71.0, 141.0, 228.0, 411.0, 927.0, 1929.0, 4934.0, 14739.0, 51005.0, 309238.0, 552162.0, 79421.0, 21338.0, 6967.0, 2581.0, 1089.0, 547.0, 271.0, 130.0, 103.0, 66.0, 35.0, 36.0, 17.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0762939453125, -0.07384490966796875, -0.0713958740234375, -0.06894683837890625, -0.066497802734375, -0.06404876708984375, -0.0615997314453125, -0.05915069580078125, -0.05670166015625, -0.05425262451171875, -0.0518035888671875, -0.04935455322265625, -0.046905517578125, -0.04445648193359375, -0.0420074462890625, -0.03955841064453125, -0.037109375, -0.03466033935546875, -0.0322113037109375, -0.02976226806640625, -0.027313232421875, -0.02486419677734375, -0.0224151611328125, -0.01996612548828125, -0.01751708984375, -0.01506805419921875, -0.0126190185546875, -0.01016998291015625, -0.007720947265625, -0.00527191162109375, -0.0028228759765625, -0.00037384033203125, 0.0020751953125, 0.00452423095703125, 0.0069732666015625, 0.00942230224609375, 0.011871337890625, 0.01432037353515625, 0.0167694091796875, 0.01921844482421875, 0.02166748046875, 0.02411651611328125, 0.0265655517578125, 0.02901458740234375, 0.031463623046875, 0.03391265869140625, 0.0363616943359375, 0.03881072998046875, 0.041259765625, 0.04370880126953125, 0.0461578369140625, 0.04860687255859375, 0.051055908203125, 0.05350494384765625, 0.0559539794921875, 0.05840301513671875, 0.06085205078125, 0.06330108642578125, 0.0657501220703125, 0.06819915771484375, 0.070648193359375, 0.07309722900390625, 0.0755462646484375, 0.07799530029296875, 0.0804443359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 9.0, 12.0, 10.0, 17.0, 26.0, 23.0, 52.0, 62.0, 80.0, 84.0, 108.0, 102.0, 89.0, 71.0, 57.0, 47.0, 25.0, 21.0, 25.0, 15.0, 10.0, 13.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07586669921875, -0.07362937927246094, -0.07139205932617188, -0.06915473937988281, -0.06691741943359375, -0.06468009948730469, -0.062442779541015625, -0.06020545959472656, -0.0579681396484375, -0.05573081970214844, -0.053493499755859375, -0.05125617980957031, -0.04901885986328125, -0.04678153991699219, -0.044544219970703125, -0.04230690002441406, -0.040069580078125, -0.03783226013183594, -0.035594940185546875, -0.03335762023925781, -0.03112030029296875, -0.028882980346679688, -0.026645660400390625, -0.024408340454101562, -0.0221710205078125, -0.019933700561523438, -0.017696380615234375, -0.015459060668945312, -0.01322174072265625, -0.010984420776367188, -0.008747100830078125, -0.0065097808837890625, -0.0042724609375, -0.0020351409912109375, 0.000202178955078125, 0.0024394989013671875, 0.00467681884765625, 0.0069141387939453125, 0.009151458740234375, 0.011388778686523438, 0.0136260986328125, 0.015863418579101562, 0.018100738525390625, 0.020338058471679688, 0.02257537841796875, 0.024812698364257812, 0.027050018310546875, 0.029287338256835938, 0.031524658203125, 0.03376197814941406, 0.035999298095703125, 0.03823661804199219, 0.04047393798828125, 0.04271125793457031, 0.044948577880859375, 0.04718589782714844, 0.0494232177734375, 0.05166053771972656, 0.053897857666015625, 0.05613517761230469, 0.05837249755859375, 0.06060981750488281, 0.06284713745117188, 0.06508445739746094, 0.06732177734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 20.0, 54.0, 149.0, 318.0, 287.0, 129.0, 38.0, 8.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.373222827911377, -4.260837078094482, -4.14845085144043, -4.036065101623535, -3.9236793518066406, -3.811293363571167, -3.6989073753356934, -3.586521625518799, -3.4741358757019043, -3.3617498874664307, -3.249364137649536, -3.1369781494140625, -3.024592399597168, -2.9122064113616943, -2.7998204231262207, -2.687434673309326, -2.5750486850738525, -2.462662696838379, -2.3502769470214844, -2.2378909587860107, -2.125505208969116, -2.0131192207336426, -1.9007333517074585, -1.7883474826812744, -1.6759616136550903, -1.5635757446289062, -1.4511898756027222, -1.338804006576538, -1.2264180183410645, -1.11403226852417, -1.0016462802886963, -0.8892604112625122, -0.7768745422363281, -0.664488673210144, -0.55210280418396, -0.4397168755531311, -0.327331006526947, -0.21494513750076294, -0.10255920886993408, 0.00982666015625, 0.12221252918243408, 0.23459841310977936, 0.34698429703712463, 0.4593701958656311, 0.5717560648918152, 0.6841419339179993, 0.7965278625488281, 0.9089137315750122, 1.0212996006011963, 1.1336854696273804, 1.2460713386535645, 1.358457326889038, 1.4708430767059326, 1.5832290649414062, 1.6956149339675903, 1.8080008029937744, 1.9203866720199585, 2.0327725410461426, 2.145158529281616, 2.2575442790985107, 2.3699302673339844, 2.482316017150879, 2.5947020053863525, 2.707087993621826, 2.8194737434387207]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 1.0, 12.0, 4.0, 10.0, 8.0, 8.0, 14.0, 15.0, 18.0, 21.0, 27.0, 36.0, 23.0, 30.0, 26.0, 38.0, 45.0, 33.0, 50.0, 44.0, 45.0, 44.0, 50.0, 45.0, 40.0, 40.0, 42.0, 40.0, 25.0, 18.0, 24.0, 19.0, 15.0, 19.0, 11.0, 9.0, 13.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3927788734436035, -1.3483463525772095, -1.3039138317108154, -1.2594811916351318, -1.2150486707687378, -1.1706161499023438, -1.1261836290359497, -1.0817511081695557, -1.037318468093872, -0.992885947227478, -0.9484533667564392, -0.9040208458900452, -0.8595882654190063, -0.8151557445526123, -0.7707232236862183, -0.7262907028198242, -0.6818581819534302, -0.6374256610870361, -0.5929930806159973, -0.5485605597496033, -0.5041279792785645, -0.4596954584121704, -0.41526293754577637, -0.37083038687705994, -0.3263978362083435, -0.2819652855396271, -0.23753274977207184, -0.1931002140045166, -0.14866766333580017, -0.10423511266708374, -0.0598025918006897, -0.015370041131973267, 0.029062509536743164, 0.073495052754879, 0.11792759597301483, 0.16236013174057007, 0.2067926824092865, 0.25122523307800293, 0.295657753944397, 0.3400903046131134, 0.38452285528182983, 0.42895540595054626, 0.4733879566192627, 0.5178204774856567, 0.5622529983520508, 0.6066855788230896, 0.6511180996894836, 0.6955506801605225, 0.7399832010269165, 0.7844157218933105, 0.8288483023643494, 0.8732808232307434, 0.9177134037017822, 0.9621459245681763, 1.0065784454345703, 1.0510109663009644, 1.0954434871673584, 1.1398760080337524, 1.1843085289001465, 1.22874116897583, 1.2731736898422241, 1.3176062107086182, 1.3620387315750122, 1.4064712524414062, 1.4509038925170898]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 10.0, 8.0, 14.0, 7.0, 13.0, 22.0, 26.0, 65.0, 98.0, 166.0, 343.0, 592.0, 1334.0, 3523.0, 14892.0, 200875.0, 3921950.0, 39910.0, 6636.0, 2021.0, 808.0, 378.0, 221.0, 142.0, 77.0, 51.0, 29.0, 22.0, 13.0, 7.0, 6.0, 5.0, 10.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.61767578125, -0.5990982055664062, -0.5805206298828125, -0.5619430541992188, -0.543365478515625, -0.5247879028320312, -0.5062103271484375, -0.48763275146484375, -0.46905517578125, -0.45047760009765625, -0.4319000244140625, -0.41332244873046875, -0.394744873046875, -0.37616729736328125, -0.3575897216796875, -0.33901214599609375, -0.3204345703125, -0.30185699462890625, -0.2832794189453125, -0.26470184326171875, -0.246124267578125, -0.22754669189453125, -0.2089691162109375, -0.19039154052734375, -0.17181396484375, -0.15323638916015625, -0.1346588134765625, -0.11608123779296875, -0.097503662109375, -0.07892608642578125, -0.0603485107421875, -0.04177093505859375, -0.023193359375, -0.00461578369140625, 0.0139617919921875, 0.03253936767578125, 0.051116943359375, 0.06969451904296875, 0.0882720947265625, 0.10684967041015625, 0.12542724609375, 0.14400482177734375, 0.1625823974609375, 0.18115997314453125, 0.199737548828125, 0.21831512451171875, 0.2368927001953125, 0.25547027587890625, 0.2740478515625, 0.29262542724609375, 0.3112030029296875, 0.32978057861328125, 0.348358154296875, 0.36693572998046875, 0.3855133056640625, 0.40409088134765625, 0.42266845703125, 0.44124603271484375, 0.4598236083984375, 0.47840118408203125, 0.496978759765625, 0.5155563354492188, 0.5341339111328125, 0.5527114868164062, 0.5712890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 11.0, 10.0, 22.0, 37.0, 44.0, 72.0, 90.0, 97.0, 96.0, 119.0, 91.0, 77.0, 66.0, 46.0, 33.0, 25.0, 12.0, 10.0, 14.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13582229614257812, -0.13016510009765625, -0.12450790405273438, -0.1188507080078125, -0.11319351196289062, -0.10753631591796875, -0.10187911987304688, -0.096221923828125, -0.09056472778320312, -0.08490753173828125, -0.07925033569335938, -0.0735931396484375, -0.06793594360351562, -0.06227874755859375, -0.056621551513671875, -0.05096435546875, -0.045307159423828125, -0.03964996337890625, -0.033992767333984375, -0.0283355712890625, -0.022678375244140625, -0.01702117919921875, -0.011363983154296875, -0.005706787109375, -4.9591064453125e-05, 0.00560760498046875, 0.011264801025390625, 0.0169219970703125, 0.022579193115234375, 0.02823638916015625, 0.033893585205078125, 0.03955078125, 0.045207977294921875, 0.05086517333984375, 0.056522369384765625, 0.0621795654296875, 0.06783676147460938, 0.07349395751953125, 0.07915115356445312, 0.084808349609375, 0.09046554565429688, 0.09612274169921875, 0.10177993774414062, 0.1074371337890625, 0.11309432983398438, 0.11875152587890625, 0.12440872192382812, 0.13006591796875, 0.13572311401367188, 0.14138031005859375, 0.14703750610351562, 0.1526947021484375, 0.15835189819335938, 0.16400909423828125, 0.16966629028320312, 0.175323486328125, 0.18098068237304688, 0.18663787841796875, 0.19229507446289062, 0.1979522705078125, 0.20360946655273438, 0.20926666259765625, 0.21492385864257812, 0.2205810546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 10.0, 9.0, 15.0, 42.0, 88.0, 104.0, 209.0, 396.0, 713.0, 1360.0, 3118.0, 8207.0, 32173.0, 352408.0, 3678585.0, 91251.0, 16228.0, 5066.0, 2064.0, 1000.0, 565.0, 310.0, 138.0, 108.0, 45.0, 27.0, 23.0, 15.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359619140625, -0.3497047424316406, -0.33979034423828125, -0.3298759460449219, -0.3199615478515625, -0.3100471496582031, -0.30013275146484375, -0.2902183532714844, -0.280303955078125, -0.2703895568847656, -0.26047515869140625, -0.2505607604980469, -0.2406463623046875, -0.23073196411132812, -0.22081756591796875, -0.21090316772460938, -0.20098876953125, -0.19107437133789062, -0.18115997314453125, -0.17124557495117188, -0.1613311767578125, -0.15141677856445312, -0.14150238037109375, -0.13158798217773438, -0.121673583984375, -0.11175918579101562, -0.10184478759765625, -0.09193038940429688, -0.0820159912109375, -0.07210159301757812, -0.06218719482421875, -0.052272796630859375, -0.0423583984375, -0.032444000244140625, -0.02252960205078125, -0.012615203857421875, -0.0027008056640625, 0.007213592529296875, 0.01712799072265625, 0.027042388916015625, 0.036956787109375, 0.046871185302734375, 0.05678558349609375, 0.06669998168945312, 0.0766143798828125, 0.08652877807617188, 0.09644317626953125, 0.10635757446289062, 0.11627197265625, 0.12618637084960938, 0.13610076904296875, 0.14601516723632812, 0.1559295654296875, 0.16584396362304688, 0.17575836181640625, 0.18567276000976562, 0.195587158203125, 0.20550155639648438, 0.21541595458984375, 0.22533035278320312, 0.2352447509765625, 0.24515914916992188, 0.25507354736328125, 0.2649879455566406, 0.27490234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 9.0, 16.0, 22.0, 35.0, 70.0, 137.0, 526.0, 2500.0, 461.0, 132.0, 45.0, 37.0, 16.0, 15.0, 14.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1417236328125, -0.13691329956054688, -0.13210296630859375, -0.12729263305664062, -0.1224822998046875, -0.11767196655273438, -0.11286163330078125, -0.10805130004882812, -0.103240966796875, -0.09843063354492188, -0.09362030029296875, -0.08880996704101562, -0.0839996337890625, -0.07918930053710938, -0.07437896728515625, -0.06956863403320312, -0.06475830078125, -0.059947967529296875, -0.05513763427734375, -0.050327301025390625, -0.0455169677734375, -0.040706634521484375, -0.03589630126953125, -0.031085968017578125, -0.026275634765625, -0.021465301513671875, -0.01665496826171875, -0.011844635009765625, -0.0070343017578125, -0.002223968505859375, 0.00258636474609375, 0.007396697998046875, 0.01220703125, 0.017017364501953125, 0.02182769775390625, 0.026638031005859375, 0.0314483642578125, 0.036258697509765625, 0.04106903076171875, 0.045879364013671875, 0.050689697265625, 0.055500030517578125, 0.06031036376953125, 0.06512069702148438, 0.0699310302734375, 0.07474136352539062, 0.07955169677734375, 0.08436203002929688, 0.08917236328125, 0.09398269653320312, 0.09879302978515625, 0.10360336303710938, 0.1084136962890625, 0.11322402954101562, 0.11803436279296875, 0.12284469604492188, 0.127655029296875, 0.13246536254882812, 0.13727569580078125, 0.14208602905273438, 0.1468963623046875, 0.15170669555664062, 0.15651702880859375, 0.16132736206054688, 0.1661376953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 6.0, 10.0, 13.0, 33.0, 43.0, 73.0, 131.0, 158.0, 164.0, 149.0, 93.0, 65.0, 29.0, 14.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5560423731803894, -0.5384963154792786, -0.5209503173828125, -0.5034042596817017, -0.4858582317829132, -0.46831220388412476, -0.4507661461830139, -0.43322011828422546, -0.415674090385437, -0.39812806248664856, -0.3805820345878601, -0.36303597688674927, -0.3454899489879608, -0.32794392108917236, -0.3103978633880615, -0.29285183548927307, -0.2753058075904846, -0.25775977969169617, -0.24021373689174652, -0.22266769409179688, -0.20512166619300842, -0.18757563829421997, -0.17002959549427032, -0.15248355269432068, -0.13493752479553223, -0.11739148944616318, -0.09984545409679413, -0.08229941874742508, -0.06475338339805603, -0.04720734804868698, -0.029661312699317932, -0.012115277349948883, 0.005430698394775391, 0.02297673374414444, 0.04052276909351349, 0.05806880444288254, 0.07561483979225159, 0.09316087514162064, 0.11070691049098969, 0.12825295329093933, 0.14579898118972778, 0.16334500908851624, 0.18089105188846588, 0.19843709468841553, 0.21598312258720398, 0.23352915048599243, 0.25107520818710327, 0.2686212360858917, 0.2861672639846802, 0.30371329188346863, 0.3212593197822571, 0.3388053774833679, 0.35635140538215637, 0.3738974332809448, 0.39144349098205566, 0.4089895188808441, 0.42653554677963257, 0.444081574678421, 0.4616276025772095, 0.4791736602783203, 0.49671968817710876, 0.5142657160758972, 0.5318117737770081, 0.5493577718734741, 0.566903829574585]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 16.0, 19.0, 16.0, 18.0, 23.0, 25.0, 32.0, 37.0, 45.0, 51.0, 45.0, 60.0, 57.0, 63.0, 63.0, 57.0, 70.0, 50.0, 44.0, 40.0, 31.0, 24.0, 31.0, 18.0, 11.0, 6.0, 16.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.48112577199935913, -0.46922507882118225, -0.457324355840683, -0.4454236626625061, -0.43352293968200684, -0.42162224650382996, -0.4097215235233307, -0.3978208303451538, -0.38592010736465454, -0.37401941418647766, -0.3621186912059784, -0.3502179980278015, -0.33831727504730225, -0.32641658186912537, -0.3145158588886261, -0.3026151657104492, -0.29071444272994995, -0.27881374955177307, -0.2669130265712738, -0.2550123333930969, -0.24311161041259766, -0.23121090233325958, -0.2193101942539215, -0.20740950107574463, -0.19550880789756775, -0.18360809981822968, -0.1717073917388916, -0.15980668365955353, -0.14790597558021545, -0.13600526750087738, -0.1241045668721199, -0.11220385879278183, -0.10030314326286316, -0.08840243518352509, -0.07650172710418701, -0.06460101902484894, -0.05270031467080116, -0.04079960659146309, -0.028898902237415314, -0.01699819415807724, -0.005097486078739166, 0.006803221069276333, 0.018703928217291832, 0.030604634433984756, 0.04250534251332283, 0.054406050592660904, 0.06630675494670868, 0.07820746302604675, 0.09010817110538483, 0.1020088791847229, 0.11390958726406097, 0.12581029534339905, 0.13771100342273712, 0.1496117115020752, 0.16151240468025208, 0.17341312766075134, 0.18531382083892822, 0.1972145289182663, 0.20911523699760437, 0.22101594507694244, 0.23291665315628052, 0.2448173612356186, 0.25671806931495667, 0.26861876249313354, 0.2805194854736328]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 15.0, 19.0, 20.0, 49.0, 77.0, 119.0, 262.0, 480.0, 1058.0, 2959.0, 11111.0, 73832.0, 674723.0, 250223.0, 25131.0, 5346.0, 1657.0, 726.0, 327.0, 158.0, 92.0, 62.0, 28.0, 22.0, 14.0, 12.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6430511474609375, -0.623992919921875, -0.6049346923828125, -0.58587646484375, -0.5668182373046875, -0.547760009765625, -0.5287017822265625, -0.5096435546875, -0.4905853271484375, -0.471527099609375, -0.4524688720703125, -0.43341064453125, -0.4143524169921875, -0.395294189453125, -0.3762359619140625, -0.357177734375, -0.3381195068359375, -0.319061279296875, -0.3000030517578125, -0.28094482421875, -0.2618865966796875, -0.242828369140625, -0.2237701416015625, -0.2047119140625, -0.1856536865234375, -0.166595458984375, -0.1475372314453125, -0.12847900390625, -0.1094207763671875, -0.090362548828125, -0.0713043212890625, -0.05224609375, -0.0331878662109375, -0.014129638671875, 0.0049285888671875, 0.02398681640625, 0.0430450439453125, 0.062103271484375, 0.0811614990234375, 0.1002197265625, 0.1192779541015625, 0.138336181640625, 0.1573944091796875, 0.17645263671875, 0.1955108642578125, 0.214569091796875, 0.2336273193359375, 0.252685546875, 0.2717437744140625, 0.290802001953125, 0.3098602294921875, 0.32891845703125, 0.3479766845703125, 0.367034912109375, 0.3860931396484375, 0.4051513671875, 0.4242095947265625, 0.443267822265625, 0.4623260498046875, 0.48138427734375, 0.5004425048828125, 0.519500732421875, 0.5385589599609375, 0.5576171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 12.0, 13.0, 17.0, 28.0, 43.0, 63.0, 102.0, 95.0, 101.0, 127.0, 104.0, 75.0, 63.0, 51.0, 32.0, 22.0, 19.0, 6.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1560192108154297, -0.15005111694335938, -0.14408302307128906, -0.13811492919921875, -0.13214683532714844, -0.12617874145507812, -0.12021064758300781, -0.1142425537109375, -0.10827445983886719, -0.10230636596679688, -0.09633827209472656, -0.09037017822265625, -0.08440208435058594, -0.07843399047851562, -0.07246589660644531, -0.066497802734375, -0.06052970886230469, -0.054561614990234375, -0.04859352111816406, -0.04262542724609375, -0.03665733337402344, -0.030689239501953125, -0.024721145629882812, -0.0187530517578125, -0.012784957885742188, -0.006816864013671875, -0.0008487701416015625, 0.00511932373046875, 0.011087417602539062, 0.017055511474609375, 0.023023605346679688, 0.02899169921875, 0.03495979309082031, 0.040927886962890625, 0.04689598083496094, 0.05286407470703125, 0.05883216857910156, 0.06480026245117188, 0.07076835632324219, 0.0767364501953125, 0.08270454406738281, 0.08867263793945312, 0.09464073181152344, 0.10060882568359375, 0.10657691955566406, 0.11254501342773438, 0.11851310729980469, 0.124481201171875, 0.1304492950439453, 0.13641738891601562, 0.14238548278808594, 0.14835357666015625, 0.15432167053222656, 0.16028976440429688, 0.1662578582763672, 0.1722259521484375, 0.1781940460205078, 0.18416213989257812, 0.19013023376464844, 0.19609832763671875, 0.20206642150878906, 0.20803451538085938, 0.2140026092529297, 0.219970703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 3.0, 18.0, 20.0, 18.0, 41.0, 45.0, 97.0, 145.0, 311.0, 587.0, 1266.0, 3497.0, 10719.0, 42070.0, 226977.0, 574208.0, 147034.0, 28707.0, 7993.0, 2644.0, 1058.0, 501.0, 209.0, 135.0, 81.0, 62.0, 33.0, 17.0, 10.0, 16.0, 4.0, 6.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3241424560546875, -0.313812255859375, -0.3034820556640625, -0.29315185546875, -0.2828216552734375, -0.272491455078125, -0.2621612548828125, -0.2518310546875, -0.2415008544921875, -0.231170654296875, -0.2208404541015625, -0.21051025390625, -0.2001800537109375, -0.189849853515625, -0.1795196533203125, -0.169189453125, -0.1588592529296875, -0.148529052734375, -0.1381988525390625, -0.12786865234375, -0.1175384521484375, -0.107208251953125, -0.0968780517578125, -0.0865478515625, -0.0762176513671875, -0.065887451171875, -0.0555572509765625, -0.04522705078125, -0.0348968505859375, -0.024566650390625, -0.0142364501953125, -0.00390625, 0.0064239501953125, 0.016754150390625, 0.0270843505859375, 0.03741455078125, 0.0477447509765625, 0.058074951171875, 0.0684051513671875, 0.0787353515625, 0.0890655517578125, 0.099395751953125, 0.1097259521484375, 0.12005615234375, 0.1303863525390625, 0.140716552734375, 0.1510467529296875, 0.161376953125, 0.1717071533203125, 0.182037353515625, 0.1923675537109375, 0.20269775390625, 0.2130279541015625, 0.223358154296875, 0.2336883544921875, 0.2440185546875, 0.2543487548828125, 0.264678955078125, 0.2750091552734375, 0.28533935546875, 0.2956695556640625, 0.305999755859375, 0.3163299560546875, 0.32666015625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 5.0, 7.0, 9.0, 10.0, 11.0, 17.0, 8.0, 22.0, 19.0, 24.0, 25.0, 25.0, 42.0, 50.0, 35.0, 50.0, 47.0, 47.0, 47.0, 52.0, 54.0, 45.0, 45.0, 42.0, 45.0, 34.0, 36.0, 25.0, 25.0, 12.0, 15.0, 13.0, 14.0, 5.0, 8.0, 8.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0], "bins": [-0.475341796875, -0.46256256103515625, -0.4497833251953125, -0.43700408935546875, -0.424224853515625, -0.41144561767578125, -0.3986663818359375, -0.38588714599609375, -0.37310791015625, -0.36032867431640625, -0.3475494384765625, -0.33477020263671875, -0.321990966796875, -0.30921173095703125, -0.2964324951171875, -0.28365325927734375, -0.2708740234375, -0.25809478759765625, -0.2453155517578125, -0.23253631591796875, -0.219757080078125, -0.20697784423828125, -0.1941986083984375, -0.18141937255859375, -0.16864013671875, -0.15586090087890625, -0.1430816650390625, -0.13030242919921875, -0.117523193359375, -0.10474395751953125, -0.0919647216796875, -0.07918548583984375, -0.06640625, -0.05362701416015625, -0.0408477783203125, -0.02806854248046875, -0.015289306640625, -0.00251007080078125, 0.0102691650390625, 0.02304840087890625, 0.03582763671875, 0.04860687255859375, 0.0613861083984375, 0.07416534423828125, 0.086944580078125, 0.09972381591796875, 0.1125030517578125, 0.12528228759765625, 0.1380615234375, 0.15084075927734375, 0.1636199951171875, 0.17639923095703125, 0.189178466796875, 0.20195770263671875, 0.2147369384765625, 0.22751617431640625, 0.24029541015625, 0.25307464599609375, 0.2658538818359375, 0.27863311767578125, 0.291412353515625, 0.30419158935546875, 0.3169708251953125, 0.32975006103515625, 0.342529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 8.0, 6.0, 14.0, 18.0, 36.0, 70.0, 149.0, 290.0, 783.0, 3063.0, 23872.0, 625264.0, 374216.0, 17049.0, 2454.0, 697.0, 279.0, 132.0, 69.0, 41.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2373046875, -0.22910308837890625, -0.2209014892578125, -0.21269989013671875, -0.204498291015625, -0.19629669189453125, -0.1880950927734375, -0.17989349365234375, -0.17169189453125, -0.16349029541015625, -0.1552886962890625, -0.14708709716796875, -0.138885498046875, -0.13068389892578125, -0.1224822998046875, -0.11428070068359375, -0.1060791015625, -0.09787750244140625, -0.0896759033203125, -0.08147430419921875, -0.073272705078125, -0.06507110595703125, -0.0568695068359375, -0.04866790771484375, -0.04046630859375, -0.03226470947265625, -0.0240631103515625, -0.01586151123046875, -0.007659912109375, 0.00054168701171875, 0.0087432861328125, 0.01694488525390625, 0.025146484375, 0.03334808349609375, 0.0415496826171875, 0.04975128173828125, 0.057952880859375, 0.06615447998046875, 0.0743560791015625, 0.08255767822265625, 0.09075927734375, 0.09896087646484375, 0.1071624755859375, 0.11536407470703125, 0.123565673828125, 0.13176727294921875, 0.1399688720703125, 0.14817047119140625, 0.1563720703125, 0.16457366943359375, 0.1727752685546875, 0.18097686767578125, 0.189178466796875, 0.19738006591796875, 0.2055816650390625, 0.21378326416015625, 0.22198486328125, 0.23018646240234375, 0.2383880615234375, 0.24658966064453125, 0.254791259765625, 0.26299285888671875, 0.2711944580078125, 0.27939605712890625, 0.28759765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 1.0, 15.0, 18.0, 12.0, 16.0, 39.0, 33.0, 46.0, 70.0, 125.0, 156.0, 138.0, 85.0, 60.0, 50.0, 38.0, 29.0, 18.0, 10.0, 10.0, 11.0, 8.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001074671745300293, -0.00010296422988176346, -9.846128523349762e-05, -9.395834058523178e-05, -8.945539593696594e-05, -8.49524512887001e-05, -8.044950664043427e-05, -7.594656199216843e-05, -7.144361734390259e-05, -6.694067269563675e-05, -6.243772804737091e-05, -5.793478339910507e-05, -5.3431838750839233e-05, -4.8928894102573395e-05, -4.4425949454307556e-05, -3.992300480604172e-05, -3.542006015777588e-05, -3.091711550951004e-05, -2.64141708612442e-05, -2.1911226212978363e-05, -1.7408281564712524e-05, -1.2905336916446686e-05, -8.402392268180847e-06, -3.8994476199150085e-06, 6.034970283508301e-07, 5.106441676616669e-06, 9.609386324882507e-06, 1.4112330973148346e-05, 1.8615275621414185e-05, 2.3118220269680023e-05, 2.7621164917945862e-05, 3.21241095662117e-05, 3.662705421447754e-05, 4.112999886274338e-05, 4.5632943511009216e-05, 5.0135888159275055e-05, 5.4638832807540894e-05, 5.914177745580673e-05, 6.364472210407257e-05, 6.814766675233841e-05, 7.265061140060425e-05, 7.715355604887009e-05, 8.165650069713593e-05, 8.615944534540176e-05, 9.06623899936676e-05, 9.516533464193344e-05, 9.966827929019928e-05, 0.00010417122393846512, 0.00010867416858673096, 0.0001131771132349968, 0.00011768005788326263, 0.00012218300253152847, 0.0001266859471797943, 0.00013118889182806015, 0.000135691836476326, 0.00014019478112459183, 0.00014469772577285767, 0.0001492006704211235, 0.00015370361506938934, 0.00015820655971765518, 0.00016270950436592102, 0.00016721244901418686, 0.0001717153936624527, 0.00017621833831071854, 0.00018072128295898438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 10.0, 12.0, 17.0, 27.0, 31.0, 57.0, 92.0, 143.0, 282.0, 579.0, 1493.0, 5981.0, 43199.0, 553106.0, 403427.0, 32525.0, 4986.0, 1362.0, 536.0, 273.0, 143.0, 104.0, 57.0, 35.0, 27.0, 21.0, 11.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22754859924316406, -0.22084426879882812, -0.2141399383544922, -0.20743560791015625, -0.2007312774658203, -0.19402694702148438, -0.18732261657714844, -0.1806182861328125, -0.17391395568847656, -0.16720962524414062, -0.1605052947998047, -0.15380096435546875, -0.1470966339111328, -0.14039230346679688, -0.13368797302246094, -0.126983642578125, -0.12027931213378906, -0.11357498168945312, -0.10687065124511719, -0.10016632080078125, -0.09346199035644531, -0.08675765991210938, -0.08005332946777344, -0.0733489990234375, -0.06664466857910156, -0.059940338134765625, -0.05323600769042969, -0.04653167724609375, -0.03982734680175781, -0.033123016357421875, -0.026418685913085938, -0.01971435546875, -0.013010025024414062, -0.006305694580078125, 0.0003986358642578125, 0.00710296630859375, 0.013807296752929688, 0.020511627197265625, 0.027215957641601562, 0.0339202880859375, 0.04062461853027344, 0.047328948974609375, 0.05403327941894531, 0.06073760986328125, 0.06744194030761719, 0.07414627075195312, 0.08085060119628906, 0.087554931640625, 0.09425926208496094, 0.10096359252929688, 0.10766792297363281, 0.11437225341796875, 0.12107658386230469, 0.12778091430664062, 0.13448524475097656, 0.1411895751953125, 0.14789390563964844, 0.15459823608398438, 0.1613025665283203, 0.16800689697265625, 0.1747112274169922, 0.18141555786132812, 0.18811988830566406, 0.19482421875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 15.0, 18.0, 25.0, 23.0, 70.0, 80.0, 96.0, 157.0, 160.0, 125.0, 56.0, 44.0, 45.0, 25.0, 20.0, 11.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10101318359375, -0.0947122573852539, -0.08841133117675781, -0.08211040496826172, -0.07580947875976562, -0.06950855255126953, -0.06320762634277344, -0.056906700134277344, -0.05060577392578125, -0.044304847717285156, -0.03800392150878906, -0.03170299530029297, -0.025402069091796875, -0.01910114288330078, -0.012800216674804688, -0.006499290466308594, -0.0001983642578125, 0.006102561950683594, 0.012403488159179688, 0.01870441436767578, 0.025005340576171875, 0.03130626678466797, 0.03760719299316406, 0.043908119201660156, 0.05020904541015625, 0.056509971618652344, 0.06281089782714844, 0.06911182403564453, 0.07541275024414062, 0.08171367645263672, 0.08801460266113281, 0.0943155288696289, 0.100616455078125, 0.1069173812866211, 0.11321830749511719, 0.11951923370361328, 0.12582015991210938, 0.13212108612060547, 0.13842201232910156, 0.14472293853759766, 0.15102386474609375, 0.15732479095458984, 0.16362571716308594, 0.16992664337158203, 0.17622756958007812, 0.18252849578857422, 0.1888294219970703, 0.1951303482055664, 0.2014312744140625, 0.2077322006225586, 0.2140331268310547, 0.22033405303955078, 0.22663497924804688, 0.23293590545654297, 0.23923683166503906, 0.24553775787353516, 0.25183868408203125, 0.25813961029052734, 0.26444053649902344, 0.27074146270751953, 0.2770423889160156, 0.2833433151245117, 0.2896442413330078, 0.2959451675415039, 0.30224609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 8.0, 17.0, 30.0, 65.0, 113.0, 183.0, 207.0, 191.0, 100.0, 52.0, 16.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8654857873916626, -1.7591750621795654, -1.6528642177581787, -1.5465534925460815, -1.4402427673339844, -1.3339320421218872, -1.22762131690979, -1.1213104724884033, -1.0149997472763062, -0.908689022064209, -0.802378237247467, -0.6960674524307251, -0.5897567272186279, -0.48344600200653076, -0.3771352171897888, -0.2708244323730469, -0.1645137071609497, -0.05820295214653015, 0.048107802867889404, 0.15441855788230896, 0.2607293128967285, 0.3670400381088257, 0.4733508229255676, 0.5796616077423096, 0.6859723329544067, 0.7922830581665039, 0.8985938429832458, 1.0049046277999878, 1.111215353012085, 1.2175260782241821, 1.3238368034362793, 1.430147647857666, 1.5364584922790527, 1.64276921749115, 1.749079942703247, 1.8553907871246338, 1.961701512336731, 2.068012237548828, 2.174323081970215, 2.2806339263916016, 2.386944532394409, 2.493255376815796, 2.5995659828186035, 2.7058768272399902, 2.812187671661377, 2.9184982776641846, 3.0248091220855713, 3.131119728088379, 3.2374305725097656, 3.3437414169311523, 3.45005202293396, 3.5563628673553467, 3.6626734733581543, 3.768984317779541, 3.8752951622009277, 3.9816060066223145, 4.087916374206543, 4.19422721862793, 4.300538063049316, 4.406848430633545, 4.513159275054932, 4.619470119476318, 4.725780963897705, 4.832091808319092, 4.9384026527404785]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 8.0, 11.0, 10.0, 13.0, 12.0, 17.0, 15.0, 23.0, 45.0, 35.0, 41.0, 27.0, 44.0, 43.0, 44.0, 47.0, 55.0, 35.0, 63.0, 51.0, 44.0, 41.0, 31.0, 25.0, 33.0, 32.0, 25.0, 20.0, 17.0, 21.0, 12.0, 12.0, 13.0, 7.0, 3.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.0801477432250977, -2.0130786895751953, -1.9460097551345825, -1.8789407014846802, -1.8118717670440674, -1.744802713394165, -1.6777336597442627, -1.61066472530365, -1.543595790863037, -1.4765267372131348, -1.409457802772522, -1.3423887491226196, -1.2753198146820068, -1.2082507610321045, -1.1411817073822021, -1.0741127729415894, -1.007043719291687, -0.9399747252464294, -0.8729057312011719, -0.8058366775512695, -0.7387677431106567, -0.6716986894607544, -0.6046296954154968, -0.5375607013702393, -0.4704917073249817, -0.4034227132797241, -0.33635371923446655, -0.2692846953868866, -0.20221570134162903, -0.13514670729637146, -0.0680776834487915, -0.0010086894035339355, 0.06606030464172363, 0.1331292986869812, 0.20019830763339996, 0.2672673165798187, 0.3343363106250763, 0.40140530467033386, 0.4684743285179138, 0.5355433225631714, 0.602612316608429, 0.6696813106536865, 0.7367503046989441, 0.8038192987442017, 0.870888352394104, 0.9379572868347168, 1.0050263404846191, 1.0720953941345215, 1.1391643285751343, 1.2062333822250366, 1.2733023166656494, 1.3403713703155518, 1.4074403047561646, 1.474509358406067, 1.5415782928466797, 1.608647346496582, 1.6757164001464844, 1.7427854537963867, 1.8098543882369995, 1.8769234418869019, 1.9439923763275146, 2.011061429977417, 2.0781304836273193, 2.1451992988586426, 2.212268352508545]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 16.0, 10.0, 16.0, 35.0, 43.0, 62.0, 117.0, 164.0, 337.0, 655.0, 1555.0, 4455.0, 18955.0, 343510.0, 3771826.0, 41356.0, 7213.0, 2128.0, 876.0, 380.0, 218.0, 113.0, 87.0, 49.0, 37.0, 17.0, 11.0, 10.0, 10.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471923828125, -0.4539070129394531, -0.43589019775390625, -0.4178733825683594, -0.3998565673828125, -0.3818397521972656, -0.36382293701171875, -0.3458061218261719, -0.327789306640625, -0.3097724914550781, -0.29175567626953125, -0.2737388610839844, -0.2557220458984375, -0.23770523071289062, -0.21968841552734375, -0.20167160034179688, -0.18365478515625, -0.16563796997070312, -0.14762115478515625, -0.12960433959960938, -0.1115875244140625, -0.09357070922851562, -0.07555389404296875, -0.057537078857421875, -0.039520263671875, -0.021503448486328125, -0.00348663330078125, 0.014530181884765625, 0.0325469970703125, 0.050563812255859375, 0.06858062744140625, 0.08659744262695312, 0.1046142578125, 0.12263107299804688, 0.14064788818359375, 0.15866470336914062, 0.1766815185546875, 0.19469833374023438, 0.21271514892578125, 0.23073196411132812, 0.248748779296875, 0.2667655944824219, 0.28478240966796875, 0.3027992248535156, 0.3208160400390625, 0.3388328552246094, 0.35684967041015625, 0.3748664855957031, 0.39288330078125, 0.4109001159667969, 0.42891693115234375, 0.4469337463378906, 0.4649505615234375, 0.4829673767089844, 0.5009841918945312, 0.5190010070800781, 0.537017822265625, 0.5550346374511719, 0.5730514526367188, 0.5910682678222656, 0.6090850830078125, 0.6271018981933594, 0.6451187133789062, 0.6631355285644531, 0.68115234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 5.0, 6.0, 18.0, 22.0, 25.0, 41.0, 63.0, 67.0, 92.0, 103.0, 81.0, 98.0, 84.0, 81.0, 61.0, 54.0, 28.0, 20.0, 15.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.15894508361816406, -0.15297317504882812, -0.1470012664794922, -0.14102935791015625, -0.1350574493408203, -0.12908554077148438, -0.12311363220214844, -0.1171417236328125, -0.11116981506347656, -0.10519790649414062, -0.09922599792480469, -0.09325408935546875, -0.08728218078613281, -0.08131027221679688, -0.07533836364746094, -0.069366455078125, -0.06339454650878906, -0.057422637939453125, -0.05145072937011719, -0.04547882080078125, -0.03950691223144531, -0.033535003662109375, -0.027563095092773438, -0.0215911865234375, -0.015619277954101562, -0.009647369384765625, -0.0036754608154296875, 0.00229644775390625, 0.008268356323242188, 0.014240264892578125, 0.020212173461914062, 0.02618408203125, 0.03215599060058594, 0.038127899169921875, 0.04409980773925781, 0.05007171630859375, 0.05604362487792969, 0.062015533447265625, 0.06798744201660156, 0.0739593505859375, 0.07993125915527344, 0.08590316772460938, 0.09187507629394531, 0.09784698486328125, 0.10381889343261719, 0.10979080200195312, 0.11576271057128906, 0.121734619140625, 0.12770652770996094, 0.13367843627929688, 0.1396503448486328, 0.14562225341796875, 0.1515941619873047, 0.15756607055664062, 0.16353797912597656, 0.1695098876953125, 0.17548179626464844, 0.18145370483398438, 0.1874256134033203, 0.19339752197265625, 0.1993694305419922, 0.20534133911132812, 0.21131324768066406, 0.21728515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 5.0, 4.0, 15.0, 8.0, 5.0, 16.0, 25.0, 28.0, 48.0, 61.0, 81.0, 130.0, 168.0, 267.0, 389.0, 596.0, 889.0, 1523.0, 2535.0, 4847.0, 9904.0, 25458.0, 90461.0, 868871.0, 2961743.0, 161409.0, 37395.0, 13252.0, 5915.0, 3165.0, 1760.0, 1069.0, 709.0, 449.0, 301.0, 232.0, 159.0, 131.0, 72.0, 46.0, 36.0, 33.0, 22.0, 17.0, 10.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 1.0], "bins": [-0.2296142578125, -0.2230854034423828, -0.21655654907226562, -0.21002769470214844, -0.20349884033203125, -0.19696998596191406, -0.19044113159179688, -0.1839122772216797, -0.1773834228515625, -0.1708545684814453, -0.16432571411132812, -0.15779685974121094, -0.15126800537109375, -0.14473915100097656, -0.13821029663085938, -0.1316814422607422, -0.125152587890625, -0.11862373352050781, -0.11209487915039062, -0.10556602478027344, -0.09903717041015625, -0.09250831604003906, -0.08597946166992188, -0.07945060729980469, -0.0729217529296875, -0.06639289855957031, -0.059864044189453125, -0.05333518981933594, -0.04680633544921875, -0.04027748107910156, -0.033748626708984375, -0.027219772338867188, -0.02069091796875, -0.014162063598632812, -0.007633209228515625, -0.0011043548583984375, 0.00542449951171875, 0.011953353881835938, 0.018482208251953125, 0.025011062622070312, 0.0315399169921875, 0.03806877136230469, 0.044597625732421875, 0.05112648010253906, 0.05765533447265625, 0.06418418884277344, 0.07071304321289062, 0.07724189758300781, 0.083770751953125, 0.09029960632324219, 0.09682846069335938, 0.10335731506347656, 0.10988616943359375, 0.11641502380371094, 0.12294387817382812, 0.1294727325439453, 0.1360015869140625, 0.1425304412841797, 0.14905929565429688, 0.15558815002441406, 0.16211700439453125, 0.16864585876464844, 0.17517471313476562, 0.1817035675048828, 0.188232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 9.0, 8.0, 18.0, 16.0, 31.0, 52.0, 82.0, 211.0, 886.0, 2012.0, 380.0, 151.0, 79.0, 37.0, 24.0, 21.0, 8.0, 12.0, 7.0, 1.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.136810302734375, -0.13092041015625, -0.125030517578125, -0.119140625, -0.113250732421875, -0.10736083984375, -0.101470947265625, -0.0955810546875, -0.089691162109375, -0.08380126953125, -0.077911376953125, -0.072021484375, -0.066131591796875, -0.06024169921875, -0.054351806640625, -0.0484619140625, -0.042572021484375, -0.03668212890625, -0.030792236328125, -0.02490234375, -0.019012451171875, -0.01312255859375, -0.007232666015625, -0.0013427734375, 0.004547119140625, 0.01043701171875, 0.016326904296875, 0.022216796875, 0.028106689453125, 0.03399658203125, 0.039886474609375, 0.0457763671875, 0.051666259765625, 0.05755615234375, 0.063446044921875, 0.0693359375, 0.075225830078125, 0.08111572265625, 0.087005615234375, 0.0928955078125, 0.098785400390625, 0.10467529296875, 0.110565185546875, 0.116455078125, 0.122344970703125, 0.12823486328125, 0.134124755859375, 0.1400146484375, 0.145904541015625, 0.15179443359375, 0.157684326171875, 0.16357421875, 0.169464111328125, 0.17535400390625, 0.181243896484375, 0.1871337890625, 0.193023681640625, 0.19891357421875, 0.204803466796875, 0.210693359375, 0.216583251953125, 0.22247314453125, 0.228363037109375, 0.2342529296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 6.0, 21.0, 39.0, 48.0, 99.0, 124.0, 162.0, 143.0, 116.0, 96.0, 43.0, 39.0, 19.0, 13.0, 8.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.5749846696853638, -0.5522289276123047, -0.5294732451438904, -0.5067175030708313, -0.4839617609977722, -0.4612060487270355, -0.43845033645629883, -0.41569459438323975, -0.39293888211250305, -0.37018316984176636, -0.3474274277687073, -0.3246717154979706, -0.3019160032272339, -0.2791602611541748, -0.2564045488834381, -0.23364882171154022, -0.21089309453964233, -0.18813736736774445, -0.16538164019584656, -0.14262592792510986, -0.11987020075321198, -0.09711447358131409, -0.07435876131057739, -0.051603034138679504, -0.028847306966781616, -0.0060915835201740265, 0.016664139926433563, 0.039419859647750854, 0.06217558681964874, 0.08493131399154663, 0.10768702626228333, 0.1304427534341812, 0.15319854021072388, 0.17595426738262177, 0.19870999455451965, 0.22146570682525635, 0.24422143399715424, 0.2669771611690521, 0.2897328734397888, 0.3124886155128479, 0.3352443277835846, 0.3580000400543213, 0.38075578212738037, 0.40351149439811707, 0.42626720666885376, 0.44902294874191284, 0.47177866101264954, 0.49453437328338623, 0.5172901153564453, 0.5400458574295044, 0.5628015398979187, 0.5855572819709778, 0.6083130240440369, 0.6310687065124512, 0.6538244485855103, 0.6765801906585693, 0.6993359327316284, 0.7220916748046875, 0.7448473572731018, 0.7676030993461609, 0.79035884141922, 0.8131145238876343, 0.8358702659606934, 0.8586260080337524, 0.8813816905021667]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 9.0, 10.0, 12.0, 16.0, 25.0, 22.0, 27.0, 35.0, 31.0, 35.0, 45.0, 36.0, 52.0, 54.0, 48.0, 61.0, 44.0, 43.0, 51.0, 49.0, 39.0, 46.0, 41.0, 29.0, 24.0, 23.0, 20.0, 14.0, 8.0, 14.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5550470948219299, -0.5390156507492065, -0.5229842662811279, -0.5069528222084045, -0.49092140793800354, -0.47488999366760254, -0.45885854959487915, -0.44282713532447815, -0.42679572105407715, -0.41076430678367615, -0.39473289251327515, -0.37870144844055176, -0.36267003417015076, -0.34663861989974976, -0.33060717582702637, -0.31457576155662537, -0.29854434728622437, -0.28251293301582336, -0.26648151874542236, -0.250450074672699, -0.23441866040229797, -0.21838724613189697, -0.20235581696033478, -0.18632438778877258, -0.17029297351837158, -0.15426155924797058, -0.1382301300764084, -0.12219870835542679, -0.10616728663444519, -0.09013586491346359, -0.074104443192482, -0.0580730214715004, -0.0420415997505188, -0.0260101780295372, -0.009978756308555603, 0.006052665412425995, 0.022084087133407593, 0.03811550885438919, 0.05414693057537079, 0.07017835229635239, 0.08620977401733398, 0.10224119573831558, 0.11827261745929718, 0.13430404663085938, 0.15033546090126038, 0.16636687517166138, 0.18239830434322357, 0.19842973351478577, 0.21446114778518677, 0.23049256205558777, 0.24652399122714996, 0.26255542039871216, 0.27858683466911316, 0.29461824893951416, 0.31064969301223755, 0.32668110728263855, 0.34271252155303955, 0.35874393582344055, 0.37477535009384155, 0.39080679416656494, 0.40683820843696594, 0.42286962270736694, 0.43890106678009033, 0.45493248105049133, 0.47096389532089233]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 1.0, 5.0, 9.0, 14.0, 21.0, 27.0, 30.0, 43.0, 74.0, 112.0, 192.0, 313.0, 552.0, 1063.0, 2232.0, 5528.0, 16864.0, 71210.0, 354578.0, 454776.0, 105481.0, 22932.0, 6925.0, 2670.0, 1272.0, 640.0, 349.0, 214.0, 138.0, 80.0, 55.0, 46.0, 28.0, 19.0, 13.0, 12.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3343658447265625, -0.321563720703125, -0.3087615966796875, -0.29595947265625, -0.2831573486328125, -0.270355224609375, -0.2575531005859375, -0.2447509765625, -0.2319488525390625, -0.219146728515625, -0.2063446044921875, -0.19354248046875, -0.1807403564453125, -0.167938232421875, -0.1551361083984375, -0.142333984375, -0.1295318603515625, -0.116729736328125, -0.1039276123046875, -0.09112548828125, -0.0783233642578125, -0.065521240234375, -0.0527191162109375, -0.0399169921875, -0.0271148681640625, -0.014312744140625, -0.0015106201171875, 0.01129150390625, 0.0240936279296875, 0.036895751953125, 0.0496978759765625, 0.0625, 0.0753021240234375, 0.088104248046875, 0.1009063720703125, 0.11370849609375, 0.1265106201171875, 0.139312744140625, 0.1521148681640625, 0.1649169921875, 0.1777191162109375, 0.190521240234375, 0.2033233642578125, 0.21612548828125, 0.2289276123046875, 0.241729736328125, 0.2545318603515625, 0.267333984375, 0.2801361083984375, 0.292938232421875, 0.3057403564453125, 0.31854248046875, 0.3313446044921875, 0.344146728515625, 0.3569488525390625, 0.3697509765625, 0.3825531005859375, 0.395355224609375, 0.4081573486328125, 0.42095947265625, 0.4337615966796875, 0.446563720703125, 0.4593658447265625, 0.47216796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 10.0, 14.0, 28.0, 36.0, 42.0, 74.0, 97.0, 82.0, 93.0, 106.0, 91.0, 81.0, 68.0, 50.0, 40.0, 26.0, 18.0, 9.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15892410278320312, -0.15280914306640625, -0.14669418334960938, -0.1405792236328125, -0.13446426391601562, -0.12834930419921875, -0.12223434448242188, -0.116119384765625, -0.11000442504882812, -0.10388946533203125, -0.09777450561523438, -0.0916595458984375, -0.08554458618164062, -0.07942962646484375, -0.07331466674804688, -0.06719970703125, -0.061084747314453125, -0.05496978759765625, -0.048854827880859375, -0.0427398681640625, -0.036624908447265625, -0.03050994873046875, -0.024394989013671875, -0.018280029296875, -0.012165069580078125, -0.00605010986328125, 6.4849853515625e-05, 0.0061798095703125, 0.012294769287109375, 0.01840972900390625, 0.024524688720703125, 0.0306396484375, 0.036754608154296875, 0.04286956787109375, 0.048984527587890625, 0.0550994873046875, 0.061214447021484375, 0.06732940673828125, 0.07344436645507812, 0.079559326171875, 0.08567428588867188, 0.09178924560546875, 0.09790420532226562, 0.1040191650390625, 0.11013412475585938, 0.11624908447265625, 0.12236404418945312, 0.12847900390625, 0.13459396362304688, 0.14070892333984375, 0.14682388305664062, 0.1529388427734375, 0.15905380249023438, 0.16516876220703125, 0.17128372192382812, 0.177398681640625, 0.18351364135742188, 0.18962860107421875, 0.19574356079101562, 0.2018585205078125, 0.20797348022460938, 0.21408843994140625, 0.22020339965820312, 0.226318359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 6.0, 6.0, 5.0, 19.0, 13.0, 36.0, 72.0, 110.0, 225.0, 499.0, 1158.0, 4515.0, 30682.0, 418591.0, 544609.0, 40099.0, 5468.0, 1361.0, 520.0, 258.0, 125.0, 74.0, 39.0, 26.0, 13.0, 6.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.650604248046875, -0.63031005859375, -0.610015869140625, -0.5897216796875, -0.569427490234375, -0.54913330078125, -0.528839111328125, -0.508544921875, -0.488250732421875, -0.46795654296875, -0.447662353515625, -0.4273681640625, -0.407073974609375, -0.38677978515625, -0.366485595703125, -0.34619140625, -0.325897216796875, -0.30560302734375, -0.285308837890625, -0.2650146484375, -0.244720458984375, -0.22442626953125, -0.204132080078125, -0.183837890625, -0.163543701171875, -0.14324951171875, -0.122955322265625, -0.1026611328125, -0.082366943359375, -0.06207275390625, -0.041778564453125, -0.021484375, -0.001190185546875, 0.01910400390625, 0.039398193359375, 0.0596923828125, 0.079986572265625, 0.10028076171875, 0.120574951171875, 0.140869140625, 0.161163330078125, 0.18145751953125, 0.201751708984375, 0.2220458984375, 0.242340087890625, 0.26263427734375, 0.282928466796875, 0.30322265625, 0.323516845703125, 0.34381103515625, 0.364105224609375, 0.3843994140625, 0.404693603515625, 0.42498779296875, 0.445281982421875, 0.465576171875, 0.485870361328125, 0.50616455078125, 0.526458740234375, 0.5467529296875, 0.567047119140625, 0.58734130859375, 0.607635498046875, 0.6279296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 8.0, 13.0, 8.0, 15.0, 14.0, 16.0, 30.0, 38.0, 51.0, 51.0, 54.0, 52.0, 59.0, 59.0, 53.0, 64.0, 52.0, 68.0, 50.0, 42.0, 34.0, 36.0, 38.0, 23.0, 12.0, 14.0, 14.0, 9.0, 11.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6678695678710938, -0.6467742919921875, -0.6256790161132812, -0.604583740234375, -0.5834884643554688, -0.5623931884765625, -0.5412979125976562, -0.52020263671875, -0.49910736083984375, -0.4780120849609375, -0.45691680908203125, -0.435821533203125, -0.41472625732421875, -0.3936309814453125, -0.37253570556640625, -0.3514404296875, -0.33034515380859375, -0.3092498779296875, -0.28815460205078125, -0.267059326171875, -0.24596405029296875, -0.2248687744140625, -0.20377349853515625, -0.18267822265625, -0.16158294677734375, -0.1404876708984375, -0.11939239501953125, -0.098297119140625, -0.07720184326171875, -0.0561065673828125, -0.03501129150390625, -0.013916015625, 0.00717926025390625, 0.0282745361328125, 0.04936981201171875, 0.070465087890625, 0.09156036376953125, 0.1126556396484375, 0.13375091552734375, 0.15484619140625, 0.17594146728515625, 0.1970367431640625, 0.21813201904296875, 0.239227294921875, 0.26032257080078125, 0.2814178466796875, 0.30251312255859375, 0.3236083984375, 0.34470367431640625, 0.3657989501953125, 0.38689422607421875, 0.407989501953125, 0.42908477783203125, 0.4501800537109375, 0.47127532958984375, 0.49237060546875, 0.5134658813476562, 0.5345611572265625, 0.5556564331054688, 0.576751708984375, 0.5978469848632812, 0.6189422607421875, 0.6400375366210938, 0.6611328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 11.0, 13.0, 21.0, 30.0, 32.0, 69.0, 122.0, 205.0, 409.0, 978.0, 2645.0, 9077.0, 53657.0, 580858.0, 358291.0, 31989.0, 6519.0, 2014.0, 795.0, 356.0, 188.0, 96.0, 58.0, 36.0, 18.0, 25.0, 16.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1993408203125, -0.19243812561035156, -0.18553543090820312, -0.1786327362060547, -0.17173004150390625, -0.1648273468017578, -0.15792465209960938, -0.15102195739746094, -0.1441192626953125, -0.13721656799316406, -0.13031387329101562, -0.12341117858886719, -0.11650848388671875, -0.10960578918457031, -0.10270309448242188, -0.09580039978027344, -0.088897705078125, -0.08199501037597656, -0.07509231567382812, -0.06818962097167969, -0.06128692626953125, -0.05438423156738281, -0.047481536865234375, -0.04057884216308594, -0.0336761474609375, -0.026773452758789062, -0.019870758056640625, -0.012968063354492188, -0.00606536865234375, 0.0008373260498046875, 0.007740020751953125, 0.014642715454101562, 0.02154541015625, 0.028448104858398438, 0.035350799560546875, 0.04225349426269531, 0.04915618896484375, 0.05605888366699219, 0.06296157836914062, 0.06986427307128906, 0.0767669677734375, 0.08366966247558594, 0.09057235717773438, 0.09747505187988281, 0.10437774658203125, 0.11128044128417969, 0.11818313598632812, 0.12508583068847656, 0.131988525390625, 0.13889122009277344, 0.14579391479492188, 0.1526966094970703, 0.15959930419921875, 0.1665019989013672, 0.17340469360351562, 0.18030738830566406, 0.1872100830078125, 0.19411277770996094, 0.20101547241210938, 0.2079181671142578, 0.21482086181640625, 0.2217235565185547, 0.22862625122070312, 0.23552894592285156, 0.242431640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 21.0, 27.0, 44.0, 74.0, 131.0, 167.0, 181.0, 121.0, 79.0, 46.0, 32.0, 22.0, 14.0, 10.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000255584716796875, -0.00024810247123241425, -0.0002406202256679535, -0.00023313798010349274, -0.00022565573453903198, -0.00021817348897457123, -0.00021069124341011047, -0.00020320899784564972, -0.00019572675228118896, -0.0001882445067167282, -0.00018076226115226746, -0.0001732800155878067, -0.00016579777002334595, -0.0001583155244588852, -0.00015083327889442444, -0.00014335103332996368, -0.00013586878776550293, -0.00012838654220104218, -0.00012090429663658142, -0.00011342205107212067, -0.00010593980550765991, -9.845755994319916e-05, -9.09753143787384e-05, -8.349306881427765e-05, -7.60108232498169e-05, -6.852857768535614e-05, -6.104633212089539e-05, -5.356408655643463e-05, -4.608184099197388e-05, -3.859959542751312e-05, -3.111734986305237e-05, -2.3635104298591614e-05, -1.615285873413086e-05, -8.670613169670105e-06, -1.1883676052093506e-06, 6.293877959251404e-06, 1.3776123523712158e-05, 2.1258369088172913e-05, 2.8740614652633667e-05, 3.622286021709442e-05, 4.3705105781555176e-05, 5.118735134601593e-05, 5.8669596910476685e-05, 6.615184247493744e-05, 7.36340880393982e-05, 8.111633360385895e-05, 8.85985791683197e-05, 9.608082473278046e-05, 0.00010356307029724121, 0.00011104531586170197, 0.00011852756142616272, 0.00012600980699062347, 0.00013349205255508423, 0.00014097429811954498, 0.00014845654368400574, 0.0001559387892484665, 0.00016342103481292725, 0.000170903280377388, 0.00017838552594184875, 0.0001858677715063095, 0.00019335001707077026, 0.00020083226263523102, 0.00020831450819969177, 0.00021579675376415253, 0.00022327899932861328]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 10.0, 7.0, 8.0, 21.0, 39.0, 43.0, 84.0, 116.0, 215.0, 412.0, 871.0, 2221.0, 6615.0, 30306.0, 225387.0, 634629.0, 121391.0, 18317.0, 4576.0, 1658.0, 763.0, 367.0, 187.0, 106.0, 79.0, 39.0, 27.0, 16.0, 13.0, 12.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2222900390625, -0.216339111328125, -0.21038818359375, -0.204437255859375, -0.198486328125, -0.192535400390625, -0.18658447265625, -0.180633544921875, -0.1746826171875, -0.168731689453125, -0.16278076171875, -0.156829833984375, -0.15087890625, -0.144927978515625, -0.13897705078125, -0.133026123046875, -0.1270751953125, -0.121124267578125, -0.11517333984375, -0.109222412109375, -0.103271484375, -0.097320556640625, -0.09136962890625, -0.085418701171875, -0.0794677734375, -0.073516845703125, -0.06756591796875, -0.061614990234375, -0.0556640625, -0.049713134765625, -0.04376220703125, -0.037811279296875, -0.0318603515625, -0.025909423828125, -0.01995849609375, -0.014007568359375, -0.008056640625, -0.002105712890625, 0.00384521484375, 0.009796142578125, 0.0157470703125, 0.021697998046875, 0.02764892578125, 0.033599853515625, 0.03955078125, 0.045501708984375, 0.05145263671875, 0.057403564453125, 0.0633544921875, 0.069305419921875, 0.07525634765625, 0.081207275390625, 0.087158203125, 0.093109130859375, 0.09906005859375, 0.105010986328125, 0.1109619140625, 0.116912841796875, 0.12286376953125, 0.128814697265625, 0.134765625, 0.140716552734375, 0.14666748046875, 0.152618408203125, 0.1585693359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 10.0, 12.0, 20.0, 34.0, 29.0, 58.0, 53.0, 83.0, 120.0, 129.0, 111.0, 80.0, 65.0, 54.0, 35.0, 34.0, 17.0, 14.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.2140178680419922, -0.20745468139648438, -0.20089149475097656, -0.19432830810546875, -0.18776512145996094, -0.18120193481445312, -0.1746387481689453, -0.1680755615234375, -0.1615123748779297, -0.15494918823242188, -0.14838600158691406, -0.14182281494140625, -0.13525962829589844, -0.12869644165039062, -0.12213325500488281, -0.115570068359375, -0.10900688171386719, -0.10244369506835938, -0.09588050842285156, -0.08931732177734375, -0.08275413513183594, -0.07619094848632812, -0.06962776184082031, -0.0630645751953125, -0.05650138854980469, -0.049938201904296875, -0.04337501525878906, -0.03681182861328125, -0.030248641967773438, -0.023685455322265625, -0.017122268676757812, -0.01055908203125, -0.0039958953857421875, 0.002567291259765625, 0.009130477905273438, 0.01569366455078125, 0.022256851196289062, 0.028820037841796875, 0.03538322448730469, 0.0419464111328125, 0.04850959777832031, 0.055072784423828125, 0.06163597106933594, 0.06819915771484375, 0.07476234436035156, 0.08132553100585938, 0.08788871765136719, 0.094451904296875, 0.10101509094238281, 0.10757827758789062, 0.11414146423339844, 0.12070465087890625, 0.12726783752441406, 0.13383102416992188, 0.1403942108154297, 0.1469573974609375, 0.1535205841064453, 0.16008377075195312, 0.16664695739746094, 0.17321014404296875, 0.17977333068847656, 0.18633651733398438, 0.1928997039794922, 0.199462890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 14.0, 18.0, 25.0, 58.0, 86.0, 120.0, 173.0, 163.0, 134.0, 97.0, 58.0, 30.0, 13.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4668079614639282, -1.3636301755905151, -1.260452389717102, -1.1572747230529785, -1.0540969371795654, -0.9509191513061523, -0.8477413654327393, -0.744563639163971, -0.6413858532905579, -0.5382080674171448, -0.43503034114837646, -0.3318525552749634, -0.22867479920387268, -0.12549704313278198, -0.022319257259368896, 0.08085846900939941, 0.1840362548828125, 0.2872140109539032, 0.3903917670249939, 0.493569552898407, 0.5967472791671753, 0.6999250650405884, 0.8031028509140015, 0.9062805771827698, 1.009458303451538, 1.1126360893249512, 1.2158138751983643, 1.3189916610717773, 1.4221693277359009, 1.525347113609314, 1.628524899482727, 1.7317025661468506, 1.8348805904388428, 1.9380583763122559, 2.041236162185669, 2.144413948059082, 2.247591733932495, 2.350769519805908, 2.453947067260742, 2.5571248531341553, 2.6603026390075684, 2.7634804248809814, 2.8666582107543945, 2.9698359966278076, 3.0730137825012207, 3.1761913299560547, 3.279369354248047, 3.382546901702881, 3.485724925994873, 3.588902711868286, 3.692080497741699, 3.7952582836151123, 3.8984360694885254, 4.001613616943359, 4.104791641235352, 4.2079691886901855, 4.3111467361450195, 4.4143242835998535, 4.517502307891846, 4.62067985534668, 4.723857879638672, 4.827035427093506, 4.930213451385498, 5.033390998840332, 5.136569023132324]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 6.0, 9.0, 12.0, 11.0, 13.0, 24.0, 33.0, 27.0, 33.0, 37.0, 35.0, 46.0, 46.0, 41.0, 51.0, 48.0, 51.0, 51.0, 51.0, 46.0, 48.0, 43.0, 27.0, 43.0, 27.0, 24.0, 22.0, 18.0, 17.0, 13.0, 11.0, 4.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6598448753356934, -2.5676393508911133, -2.475433826446533, -2.383228302001953, -2.291022777557373, -2.198817253112793, -2.106611728668213, -2.014406204223633, -1.9222005605697632, -1.829995036125183, -1.737789511680603, -1.6455838680267334, -1.5533783435821533, -1.4611728191375732, -1.3689672946929932, -1.276761770248413, -1.184556245803833, -1.092350721359253, -1.0001451969146729, -0.907939612865448, -0.8157340884208679, -0.7235285639762878, -0.631322979927063, -0.5391174554824829, -0.44691193103790283, -0.35470640659332275, -0.2625008523464203, -0.17029529809951782, -0.07808977365493774, 0.014115750789642334, 0.10632133483886719, 0.19852685928344727, 0.29073238372802734, 0.3829379081726074, 0.4751434624195099, 0.5673490166664124, 0.6595545411109924, 0.7517600655555725, 0.8439656496047974, 0.9361711740493774, 1.0283766984939575, 1.1205822229385376, 1.2127877473831177, 1.3049933910369873, 1.3971989154815674, 1.4894044399261475, 1.5816099643707275, 1.6738154888153076, 1.7660210132598877, 1.8582265377044678, 1.9504320621490479, 2.042637586593628, 2.134843111038208, 2.227048635482788, 2.3192543983459473, 2.4114599227905273, 2.5036654472351074, 2.5958709716796875, 2.6880764961242676, 2.7802820205688477, 2.8724875450134277, 2.964693069458008, 3.056898593902588, 3.149104118347168, 3.241309642791748]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 20.0, 24.0, 30.0, 43.0, 102.0, 206.0, 585.0, 2145.0, 13381.0, 4039464.0, 130696.0, 5554.0, 1294.0, 405.0, 148.0, 74.0, 40.0, 16.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1273269653320312, -1.1003570556640625, -1.0733871459960938, -1.046417236328125, -1.0194473266601562, -0.9924774169921875, -0.9655075073242188, -0.93853759765625, -0.9115676879882812, -0.8845977783203125, -0.8576278686523438, -0.830657958984375, -0.8036880493164062, -0.7767181396484375, -0.7497482299804688, -0.7227783203125, -0.6958084106445312, -0.6688385009765625, -0.6418685913085938, -0.614898681640625, -0.5879287719726562, -0.5609588623046875, -0.5339889526367188, -0.50701904296875, -0.48004913330078125, -0.4530792236328125, -0.42610931396484375, -0.399139404296875, -0.37216949462890625, -0.3451995849609375, -0.31822967529296875, -0.291259765625, -0.26428985595703125, -0.2373199462890625, -0.21035003662109375, -0.183380126953125, -0.15641021728515625, -0.1294403076171875, -0.10247039794921875, -0.07550048828125, -0.04853057861328125, -0.0215606689453125, 0.00540924072265625, 0.032379150390625, 0.05934906005859375, 0.0863189697265625, 0.11328887939453125, 0.1402587890625, 0.16722869873046875, 0.1941986083984375, 0.22116851806640625, 0.248138427734375, 0.27510833740234375, 0.3020782470703125, 0.32904815673828125, 0.35601806640625, 0.38298797607421875, 0.4099578857421875, 0.43692779541015625, 0.463897705078125, 0.49086761474609375, 0.5178375244140625, 0.5448074340820312, 0.57177734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 12.0, 9.0, 7.0, 19.0, 33.0, 49.0, 59.0, 67.0, 83.0, 96.0, 95.0, 102.0, 76.0, 59.0, 64.0, 49.0, 31.0, 19.0, 19.0, 17.0, 13.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1851806640625, -0.17846107482910156, -0.17174148559570312, -0.1650218963623047, -0.15830230712890625, -0.1515827178955078, -0.14486312866210938, -0.13814353942871094, -0.1314239501953125, -0.12470436096191406, -0.11798477172851562, -0.11126518249511719, -0.10454559326171875, -0.09782600402832031, -0.09110641479492188, -0.08438682556152344, -0.077667236328125, -0.07094764709472656, -0.06422805786132812, -0.05750846862792969, -0.05078887939453125, -0.04406929016113281, -0.037349700927734375, -0.030630111694335938, -0.0239105224609375, -0.017190933227539062, -0.010471343994140625, -0.0037517547607421875, 0.00296783447265625, 0.009687423706054688, 0.016407012939453125, 0.023126602172851562, 0.02984619140625, 0.03656578063964844, 0.043285369873046875, 0.05000495910644531, 0.05672454833984375, 0.06344413757324219, 0.07016372680664062, 0.07688331604003906, 0.0836029052734375, 0.09032249450683594, 0.09704208374023438, 0.10376167297363281, 0.11048126220703125, 0.11720085144042969, 0.12392044067382812, 0.13064002990722656, 0.137359619140625, 0.14407920837402344, 0.15079879760742188, 0.1575183868408203, 0.16423797607421875, 0.1709575653076172, 0.17767715454101562, 0.18439674377441406, 0.1911163330078125, 0.19783592224121094, 0.20455551147460938, 0.2112751007080078, 0.21799468994140625, 0.2247142791748047, 0.23143386840820312, 0.23815345764160156, 0.244873046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 9.0, 10.0, 7.0, 11.0, 13.0, 26.0, 31.0, 54.0, 65.0, 82.0, 134.0, 178.0, 284.0, 467.0, 726.0, 1397.0, 2562.0, 5511.0, 13043.0, 41612.0, 351863.0, 3656497.0, 82923.0, 20436.0, 7994.0, 3606.0, 1867.0, 1078.0, 627.0, 411.0, 249.0, 164.0, 103.0, 78.0, 51.0, 37.0, 23.0, 15.0, 9.0, 8.0, 12.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23828125, -0.23064804077148438, -0.22301483154296875, -0.21538162231445312, -0.2077484130859375, -0.20011520385742188, -0.19248199462890625, -0.18484878540039062, -0.177215576171875, -0.16958236694335938, -0.16194915771484375, -0.15431594848632812, -0.1466827392578125, -0.13904953002929688, -0.13141632080078125, -0.12378311157226562, -0.11614990234375, -0.10851669311523438, -0.10088348388671875, -0.09325027465820312, -0.0856170654296875, -0.07798385620117188, -0.07035064697265625, -0.06271743774414062, -0.055084228515625, -0.047451019287109375, -0.03981781005859375, -0.032184600830078125, -0.0245513916015625, -0.016918182373046875, -0.00928497314453125, -0.001651763916015625, 0.0059814453125, 0.013614654541015625, 0.02124786376953125, 0.028881072998046875, 0.0365142822265625, 0.044147491455078125, 0.05178070068359375, 0.059413909912109375, 0.067047119140625, 0.07468032836914062, 0.08231353759765625, 0.08994674682617188, 0.0975799560546875, 0.10521316528320312, 0.11284637451171875, 0.12047958374023438, 0.12811279296875, 0.13574600219726562, 0.14337921142578125, 0.15101242065429688, 0.1586456298828125, 0.16627883911132812, 0.17391204833984375, 0.18154525756835938, 0.189178466796875, 0.19681167602539062, 0.20444488525390625, 0.21207809448242188, 0.2197113037109375, 0.22734451293945312, 0.23497772216796875, 0.24261093139648438, 0.250244140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 15.0, 25.0, 46.0, 91.0, 312.0, 3134.0, 264.0, 75.0, 31.0, 17.0, 11.0, 9.0, 13.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.0944662094116211, -0.09164237976074219, -0.08881855010986328, -0.08599472045898438, -0.08317089080810547, -0.08034706115722656, -0.07752323150634766, -0.07469940185546875, -0.07187557220458984, -0.06905174255371094, -0.06622791290283203, -0.06340408325195312, -0.06058025360107422, -0.05775642395019531, -0.054932594299316406, -0.0521087646484375, -0.049284934997558594, -0.04646110534667969, -0.04363727569580078, -0.040813446044921875, -0.03798961639404297, -0.03516578674316406, -0.032341957092285156, -0.02951812744140625, -0.026694297790527344, -0.023870468139648438, -0.02104663848876953, -0.018222808837890625, -0.015398979187011719, -0.012575149536132812, -0.009751319885253906, -0.006927490234375, -0.004103660583496094, -0.0012798309326171875, 0.0015439987182617188, 0.004367828369140625, 0.007191658020019531, 0.010015487670898438, 0.012839317321777344, 0.01566314697265625, 0.018486976623535156, 0.021310806274414062, 0.02413463592529297, 0.026958465576171875, 0.02978229522705078, 0.03260612487792969, 0.035429954528808594, 0.0382537841796875, 0.041077613830566406, 0.04390144348144531, 0.04672527313232422, 0.049549102783203125, 0.05237293243408203, 0.05519676208496094, 0.058020591735839844, 0.06084442138671875, 0.06366825103759766, 0.06649208068847656, 0.06931591033935547, 0.07213973999023438, 0.07496356964111328, 0.07778739929199219, 0.0806112289428711, 0.08343505859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 19.0, 56.0, 154.0, 294.0, 285.0, 147.0, 40.0, 18.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16496023535728455, -0.14373484253883362, -0.12250944972038269, -0.10128405690193176, -0.08005866408348083, -0.05883327126502991, -0.03760787844657898, -0.016382485628128052, 0.004842907190322876, 0.026068300008773804, 0.04729369282722473, 0.06851908564567566, 0.08974447846412659, 0.11096987128257751, 0.13219526410102844, 0.15342065691947937, 0.1746460497379303, 0.19587144255638123, 0.21709683537483215, 0.23832222819328308, 0.259547621011734, 0.28077301383018494, 0.30199840664863586, 0.3232237994670868, 0.3444491922855377, 0.36567458510398865, 0.3868999779224396, 0.4081253707408905, 0.42935076355934143, 0.45057615637779236, 0.4718015491962433, 0.4930269420146942, 0.5142523050308228, 0.5354776978492737, 0.5567030906677246, 0.5779284834861755, 0.5991538763046265, 0.6203792691230774, 0.6416046619415283, 0.6628300547599792, 0.6840554475784302, 0.7052808403968811, 0.726506233215332, 0.747731626033783, 0.7689570188522339, 0.7901824116706848, 0.8114078044891357, 0.8326331973075867, 0.8538585901260376, 0.8750839829444885, 0.8963093757629395, 0.9175347685813904, 0.9387601613998413, 0.9599855542182922, 0.9812109470367432, 1.0024363994598389, 1.023661732673645, 1.0448870658874512, 1.0661125183105469, 1.0873379707336426, 1.1085633039474487, 1.1297886371612549, 1.1510140895843506, 1.1722395420074463, 1.1934648752212524]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 11.0, 12.0, 10.0, 14.0, 20.0, 18.0, 18.0, 29.0, 32.0, 23.0, 31.0, 34.0, 39.0, 50.0, 65.0, 44.0, 53.0, 48.0, 51.0, 27.0, 47.0, 38.0, 35.0, 33.0, 31.0, 32.0, 29.0, 13.0, 21.0, 19.0, 15.0, 11.0, 14.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14011520147323608, -0.13536687195301056, -0.13061852753162384, -0.12587019801139832, -0.12112186849117279, -0.11637353152036667, -0.11162519454956055, -0.10687686502933502, -0.1021285280585289, -0.09738019108772278, -0.09263186156749725, -0.08788352459669113, -0.08313518762588501, -0.07838685810565948, -0.07363852113485336, -0.06889018416404724, -0.06414185464382172, -0.05939352139830589, -0.05464518815279007, -0.04989685118198395, -0.045148517936468124, -0.0404001846909523, -0.03565184772014618, -0.030903514474630356, -0.026155181229114532, -0.02140684798359871, -0.016658512875437737, -0.011910178698599339, -0.0071618445217609406, -0.002413511276245117, 0.0023348238319158554, 0.007083158940076828, 0.011831492185592651, 0.016579825431108475, 0.021328160539269447, 0.02607649564743042, 0.030824828892946243, 0.03557316213846207, 0.04032149910926819, 0.04506983235478401, 0.049818165600299835, 0.05456649884581566, 0.05931483209133148, 0.0640631690621376, 0.06881150603294373, 0.07355983555316925, 0.07830817252397537, 0.0830565094947815, 0.08780483901500702, 0.09255317598581314, 0.09730150550603867, 0.10204984247684479, 0.10679817199707031, 0.11154650896787643, 0.11629484593868256, 0.12104317545890808, 0.1257915198802948, 0.13053984940052032, 0.13528819382190704, 0.14003652334213257, 0.1447848528623581, 0.14953318238258362, 0.15428152680397034, 0.15902985632419586, 0.1637781858444214]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 6.0, 3.0, 14.0, 13.0, 23.0, 41.0, 58.0, 93.0, 149.0, 299.0, 618.0, 1330.0, 3100.0, 9602.0, 40256.0, 267894.0, 576998.0, 117094.0, 20935.0, 5984.0, 2179.0, 891.0, 418.0, 208.0, 124.0, 88.0, 49.0, 28.0, 19.0, 14.0, 5.0, 2.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43341064453125, -0.4180908203125, -0.40277099609375, -0.387451171875, -0.37213134765625, -0.3568115234375, -0.34149169921875, -0.326171875, -0.31085205078125, -0.2955322265625, -0.28021240234375, -0.264892578125, -0.24957275390625, -0.2342529296875, -0.21893310546875, -0.20361328125, -0.18829345703125, -0.1729736328125, -0.15765380859375, -0.142333984375, -0.12701416015625, -0.1116943359375, -0.09637451171875, -0.0810546875, -0.06573486328125, -0.0504150390625, -0.03509521484375, -0.019775390625, -0.00445556640625, 0.0108642578125, 0.02618408203125, 0.04150390625, 0.05682373046875, 0.0721435546875, 0.08746337890625, 0.102783203125, 0.11810302734375, 0.1334228515625, 0.14874267578125, 0.1640625, 0.17938232421875, 0.1947021484375, 0.21002197265625, 0.225341796875, 0.24066162109375, 0.2559814453125, 0.27130126953125, 0.28662109375, 0.30194091796875, 0.3172607421875, 0.33258056640625, 0.347900390625, 0.36322021484375, 0.3785400390625, 0.39385986328125, 0.4091796875, 0.42449951171875, 0.4398193359375, 0.45513916015625, 0.470458984375, 0.48577880859375, 0.5010986328125, 0.51641845703125, 0.53173828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 11.0, 7.0, 15.0, 26.0, 46.0, 60.0, 68.0, 77.0, 76.0, 112.0, 91.0, 90.0, 67.0, 61.0, 45.0, 41.0, 19.0, 27.0, 18.0, 12.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18241500854492188, -0.17562103271484375, -0.16882705688476562, -0.1620330810546875, -0.15523910522460938, -0.14844512939453125, -0.14165115356445312, -0.134857177734375, -0.12806320190429688, -0.12126922607421875, -0.11447525024414062, -0.1076812744140625, -0.10088729858398438, -0.09409332275390625, -0.08729934692382812, -0.08050537109375, -0.07371139526367188, -0.06691741943359375, -0.060123443603515625, -0.0533294677734375, -0.046535491943359375, -0.03974151611328125, -0.032947540283203125, -0.026153564453125, -0.019359588623046875, -0.01256561279296875, -0.005771636962890625, 0.0010223388671875, 0.007816314697265625, 0.01461029052734375, 0.021404266357421875, 0.0281982421875, 0.034992218017578125, 0.04178619384765625, 0.048580169677734375, 0.0553741455078125, 0.062168121337890625, 0.06896209716796875, 0.07575607299804688, 0.082550048828125, 0.08934402465820312, 0.09613800048828125, 0.10293197631835938, 0.1097259521484375, 0.11651992797851562, 0.12331390380859375, 0.13010787963867188, 0.13690185546875, 0.14369583129882812, 0.15048980712890625, 0.15728378295898438, 0.1640777587890625, 0.17087173461914062, 0.17766571044921875, 0.18445968627929688, 0.191253662109375, 0.19804763793945312, 0.20484161376953125, 0.21163558959960938, 0.2184295654296875, 0.22522354125976562, 0.23201751708984375, 0.23881149291992188, 0.24560546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 8.0, 12.0, 22.0, 30.0, 75.0, 130.0, 230.0, 607.0, 1954.0, 9839.0, 191732.0, 803800.0, 34306.0, 3995.0, 1048.0, 388.0, 161.0, 84.0, 39.0, 31.0, 17.0, 10.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80517578125, -0.7794113159179688, -0.7536468505859375, -0.7278823852539062, -0.702117919921875, -0.6763534545898438, -0.6505889892578125, -0.6248245239257812, -0.59906005859375, -0.5732955932617188, -0.5475311279296875, -0.5217666625976562, -0.496002197265625, -0.47023773193359375, -0.4444732666015625, -0.41870880126953125, -0.3929443359375, -0.36717987060546875, -0.3414154052734375, -0.31565093994140625, -0.289886474609375, -0.26412200927734375, -0.2383575439453125, -0.21259307861328125, -0.18682861328125, -0.16106414794921875, -0.1352996826171875, -0.10953521728515625, -0.083770751953125, -0.05800628662109375, -0.0322418212890625, -0.00647735595703125, 0.019287109375, 0.04505157470703125, 0.0708160400390625, 0.09658050537109375, 0.122344970703125, 0.14810943603515625, 0.1738739013671875, 0.19963836669921875, 0.22540283203125, 0.25116729736328125, 0.2769317626953125, 0.30269622802734375, 0.328460693359375, 0.35422515869140625, 0.3799896240234375, 0.40575408935546875, 0.4315185546875, 0.45728302001953125, 0.4830474853515625, 0.5088119506835938, 0.534576416015625, 0.5603408813476562, 0.5861053466796875, 0.6118698120117188, 0.63763427734375, 0.6633987426757812, 0.6891632080078125, 0.7149276733398438, 0.740692138671875, 0.7664566040039062, 0.7922210693359375, 0.8179855346679688, 0.84375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 6.0, 3.0, 5.0, 5.0, 11.0, 13.0, 20.0, 25.0, 34.0, 42.0, 50.0, 50.0, 40.0, 67.0, 47.0, 62.0, 50.0, 52.0, 77.0, 58.0, 54.0, 48.0, 40.0, 23.0, 25.0, 23.0, 15.0, 16.0, 8.0, 7.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7509765625, -0.72625732421875, -0.7015380859375, -0.67681884765625, -0.652099609375, -0.62738037109375, -0.6026611328125, -0.57794189453125, -0.55322265625, -0.52850341796875, -0.5037841796875, -0.47906494140625, -0.454345703125, -0.42962646484375, -0.4049072265625, -0.38018798828125, -0.35546875, -0.33074951171875, -0.3060302734375, -0.28131103515625, -0.256591796875, -0.23187255859375, -0.2071533203125, -0.18243408203125, -0.15771484375, -0.13299560546875, -0.1082763671875, -0.08355712890625, -0.058837890625, -0.03411865234375, -0.0093994140625, 0.01531982421875, 0.0400390625, 0.06475830078125, 0.0894775390625, 0.11419677734375, 0.138916015625, 0.16363525390625, 0.1883544921875, 0.21307373046875, 0.23779296875, 0.26251220703125, 0.2872314453125, 0.31195068359375, 0.336669921875, 0.36138916015625, 0.3861083984375, 0.41082763671875, 0.435546875, 0.46026611328125, 0.4849853515625, 0.50970458984375, 0.534423828125, 0.55914306640625, 0.5838623046875, 0.60858154296875, 0.63330078125, 0.65802001953125, 0.6827392578125, 0.70745849609375, 0.732177734375, 0.75689697265625, 0.7816162109375, 0.80633544921875, 0.8310546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 11.0, 12.0, 15.0, 20.0, 24.0, 38.0, 52.0, 96.0, 147.0, 242.0, 519.0, 1287.0, 4695.0, 45954.0, 920259.0, 67026.0, 5390.0, 1479.0, 541.0, 288.0, 125.0, 92.0, 65.0, 36.0, 26.0, 19.0, 22.0, 14.0, 6.0, 9.0, 6.0, 7.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.427734375, -0.41498565673828125, -0.4022369384765625, -0.38948822021484375, -0.376739501953125, -0.36399078369140625, -0.3512420654296875, -0.33849334716796875, -0.32574462890625, -0.31299591064453125, -0.3002471923828125, -0.28749847412109375, -0.274749755859375, -0.26200103759765625, -0.2492523193359375, -0.23650360107421875, -0.2237548828125, -0.21100616455078125, -0.1982574462890625, -0.18550872802734375, -0.172760009765625, -0.16001129150390625, -0.1472625732421875, -0.13451385498046875, -0.12176513671875, -0.10901641845703125, -0.0962677001953125, -0.08351898193359375, -0.070770263671875, -0.05802154541015625, -0.0452728271484375, -0.03252410888671875, -0.019775390625, -0.00702667236328125, 0.0057220458984375, 0.01847076416015625, 0.031219482421875, 0.04396820068359375, 0.0567169189453125, 0.06946563720703125, 0.08221435546875, 0.09496307373046875, 0.1077117919921875, 0.12046051025390625, 0.133209228515625, 0.14595794677734375, 0.1587066650390625, 0.17145538330078125, 0.1842041015625, 0.19695281982421875, 0.2097015380859375, 0.22245025634765625, 0.235198974609375, 0.24794769287109375, 0.2606964111328125, 0.27344512939453125, 0.28619384765625, 0.29894256591796875, 0.3116912841796875, 0.32444000244140625, 0.337188720703125, 0.34993743896484375, 0.3626861572265625, 0.37543487548828125, 0.38818359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 10.0, 18.0, 22.0, 35.0, 60.0, 80.0, 119.0, 117.0, 111.0, 124.0, 94.0, 73.0, 45.0, 23.0, 23.0, 12.0, 8.0, 6.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.522106170654297e-05, -7.06017017364502e-05, -6.598234176635742e-05, -6.136298179626465e-05, -5.6743621826171875e-05, -5.21242618560791e-05, -4.750490188598633e-05, -4.2885541915893555e-05, -3.826618194580078e-05, -3.364682197570801e-05, -2.9027462005615234e-05, -2.440810203552246e-05, -1.9788742065429688e-05, -1.5169382095336914e-05, -1.055002212524414e-05, -5.930662155151367e-06, -1.3113021850585938e-06, 3.3080577850341797e-06, 7.927417755126953e-06, 1.2546777725219727e-05, 1.71661376953125e-05, 2.1785497665405273e-05, 2.6404857635498047e-05, 3.102421760559082e-05, 3.5643577575683594e-05, 4.026293754577637e-05, 4.488229751586914e-05, 4.9501657485961914e-05, 5.412101745605469e-05, 5.874037742614746e-05, 6.335973739624023e-05, 6.797909736633301e-05, 7.259845733642578e-05, 7.721781730651855e-05, 8.183717727661133e-05, 8.64565372467041e-05, 9.107589721679688e-05, 9.569525718688965e-05, 0.00010031461715698242, 0.0001049339771270752, 0.00010955333709716797, 0.00011417269706726074, 0.00011879205703735352, 0.0001234114170074463, 0.00012803077697753906, 0.00013265013694763184, 0.0001372694969177246, 0.00014188885688781738, 0.00014650821685791016, 0.00015112757682800293, 0.0001557469367980957, 0.00016036629676818848, 0.00016498565673828125, 0.00016960501670837402, 0.0001742243766784668, 0.00017884373664855957, 0.00018346309661865234, 0.00018808245658874512, 0.0001927018165588379, 0.00019732117652893066, 0.00020194053649902344, 0.0002065598964691162, 0.00021117925643920898, 0.00021579861640930176, 0.00022041797637939453]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 8.0, 8.0, 16.0, 14.0, 32.0, 55.0, 111.0, 229.0, 582.0, 1733.0, 7077.0, 76156.0, 853990.0, 97379.0, 8149.0, 1854.0, 640.0, 251.0, 108.0, 50.0, 28.0, 18.0, 11.0, 12.0, 3.0, 4.0, 10.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.34716796875, -0.3373985290527344, -0.32762908935546875, -0.3178596496582031, -0.3080902099609375, -0.2983207702636719, -0.28855133056640625, -0.2787818908691406, -0.269012451171875, -0.2592430114746094, -0.24947357177734375, -0.23970413208007812, -0.2299346923828125, -0.22016525268554688, -0.21039581298828125, -0.20062637329101562, -0.19085693359375, -0.18108749389648438, -0.17131805419921875, -0.16154861450195312, -0.1517791748046875, -0.14200973510742188, -0.13224029541015625, -0.12247085571289062, -0.112701416015625, -0.10293197631835938, -0.09316253662109375, -0.08339309692382812, -0.0736236572265625, -0.06385421752929688, -0.05408477783203125, -0.044315338134765625, -0.0345458984375, -0.024776458740234375, -0.01500701904296875, -0.005237579345703125, 0.0045318603515625, 0.014301300048828125, 0.02407073974609375, 0.033840179443359375, 0.043609619140625, 0.053379058837890625, 0.06314849853515625, 0.07291793823242188, 0.0826873779296875, 0.09245681762695312, 0.10222625732421875, 0.11199569702148438, 0.12176513671875, 0.13153457641601562, 0.14130401611328125, 0.15107345581054688, 0.1608428955078125, 0.17061233520507812, 0.18038177490234375, 0.19015121459960938, 0.199920654296875, 0.20969009399414062, 0.21945953369140625, 0.22922897338867188, 0.2389984130859375, 0.24876785278320312, 0.25853729248046875, 0.2683067321777344, 0.278076171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 5.0, 13.0, 23.0, 25.0, 54.0, 85.0, 110.0, 138.0, 178.0, 125.0, 81.0, 57.0, 25.0, 18.0, 15.0, 6.0, 8.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35791015625, -0.3473472595214844, -0.33678436279296875, -0.3262214660644531, -0.3156585693359375, -0.3050956726074219, -0.29453277587890625, -0.2839698791503906, -0.273406982421875, -0.2628440856933594, -0.25228118896484375, -0.24171829223632812, -0.2311553955078125, -0.22059249877929688, -0.21002960205078125, -0.19946670532226562, -0.18890380859375, -0.17834091186523438, -0.16777801513671875, -0.15721511840820312, -0.1466522216796875, -0.13608932495117188, -0.12552642822265625, -0.11496353149414062, -0.104400634765625, -0.09383773803710938, -0.08327484130859375, -0.07271194458007812, -0.0621490478515625, -0.051586151123046875, -0.04102325439453125, -0.030460357666015625, -0.0198974609375, -0.009334564208984375, 0.00122833251953125, 0.011791229248046875, 0.0223541259765625, 0.032917022705078125, 0.04347991943359375, 0.054042816162109375, 0.064605712890625, 0.07516860961914062, 0.08573150634765625, 0.09629440307617188, 0.1068572998046875, 0.11742019653320312, 0.12798309326171875, 0.13854598999023438, 0.14910888671875, 0.15967178344726562, 0.17023468017578125, 0.18079757690429688, 0.1913604736328125, 0.20192337036132812, 0.21248626708984375, 0.22304916381835938, 0.233612060546875, 0.24417495727539062, 0.25473785400390625, 0.2653007507324219, 0.2758636474609375, 0.2864265441894531, 0.29698944091796875, 0.3075523376464844, 0.318115234375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 26.0, 68.0, 110.0, 208.0, 237.0, 165.0, 101.0, 43.0, 10.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.714663505554199, -5.53700065612793, -5.35933780670166, -5.181674957275391, -5.004011631011963, -4.826348781585693, -4.648685932159424, -4.471023082733154, -4.293359756469727, -4.115696907043457, -3.9380338191986084, -3.760370969772339, -3.5827078819274902, -3.4050450325012207, -3.227382183074951, -3.0497193336486816, -2.872056484222412, -2.6943936347961426, -2.516730546951294, -2.3390676975250244, -2.161404609680176, -1.9837417602539062, -1.8060789108276367, -1.6284159421920776, -1.4507529735565186, -1.2730900049209595, -1.0954270362854004, -0.9177641868591309, -0.7401012182235718, -0.5624382495880127, -0.38477540016174316, -0.20711243152618408, -0.029449939727783203, 0.1482129991054535, 0.3258759379386902, 0.5035388469696045, 0.6812018156051636, 0.8588647842407227, 1.0365276336669922, 1.2141906023025513, 1.3918535709381104, 1.5695165395736694, 1.7471795082092285, 1.924842357635498, 2.1025052070617676, 2.280168294906616, 2.4578311443328857, 2.6354942321777344, 2.813157081604004, 2.9908199310302734, 3.168483018875122, 3.3461458683013916, 3.5238089561462402, 3.7014718055725098, 3.8791346549987793, 4.056797504425049, 4.234460830688477, 4.412123680114746, 4.589786529541016, 4.767449378967285, 4.945112705230713, 5.122775554656982, 5.300438404083252, 5.4781012535095215, 5.655764102935791]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 11.0, 14.0, 18.0, 18.0, 19.0, 30.0, 29.0, 53.0, 35.0, 59.0, 56.0, 58.0, 75.0, 55.0, 63.0, 62.0, 42.0, 53.0, 35.0, 23.0, 33.0, 32.0, 12.0, 10.0, 19.0, 13.0, 11.0, 10.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7983930110931396, -3.6759300231933594, -3.553467035293579, -3.431004047393799, -3.3085408210754395, -3.1860780715942383, -3.063614845275879, -2.9411518573760986, -2.8186888694763184, -2.696225881576538, -2.573762893676758, -2.4512999057769775, -2.3288369178771973, -2.206373691558838, -2.0839107036590576, -1.9614477157592773, -1.838984727859497, -1.7165217399597168, -1.5940587520599365, -1.4715956449508667, -1.3491326570510864, -1.2266696691513062, -1.1042065620422363, -0.981743574142456, -0.8592805862426758, -0.7368175983428955, -0.6143545508384705, -0.4918915331363678, -0.36942851543426514, -0.24696552753448486, -0.12450248003005981, -0.0020394325256347656, 0.12042379379272461, 0.24288681149482727, 0.36534982919692993, 0.4878128468990326, 0.6102758646011353, 0.7327388525009155, 0.8552019000053406, 0.9776649475097656, 1.100127935409546, 1.2225909233093262, 1.3450539112091064, 1.4675170183181763, 1.5899800062179565, 1.7124429941177368, 1.8349061012268066, 1.957369089126587, 2.079832077026367, 2.2022950649261475, 2.3247580528259277, 2.447221040725708, 2.5696840286254883, 2.6921472549438477, 2.814610242843628, 2.937073230743408, 3.0595362186431885, 3.1819992065429688, 3.304462194442749, 3.4269251823425293, 3.5493884086608887, 3.67185115814209, 3.794314384460449, 3.9167773723602295, 4.03924036026001]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 11.0, 15.0, 19.0, 26.0, 30.0, 48.0, 103.0, 172.0, 373.0, 870.0, 2275.0, 7394.0, 40694.0, 3831087.0, 283635.0, 19770.0, 4768.0, 1621.0, 666.0, 296.0, 145.0, 85.0, 51.0, 34.0, 28.0, 17.0, 12.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.61767578125, -0.6025428771972656, -0.5874099731445312, -0.5722770690917969, -0.5571441650390625, -0.5420112609863281, -0.5268783569335938, -0.5117454528808594, -0.496612548828125, -0.4814796447753906, -0.46634674072265625, -0.4512138366699219, -0.4360809326171875, -0.4209480285644531, -0.40581512451171875, -0.3906822204589844, -0.37554931640625, -0.3604164123535156, -0.34528350830078125, -0.3301506042480469, -0.3150177001953125, -0.2998847961425781, -0.28475189208984375, -0.2696189880371094, -0.254486083984375, -0.23935317993164062, -0.22422027587890625, -0.20908737182617188, -0.1939544677734375, -0.17882156372070312, -0.16368865966796875, -0.14855575561523438, -0.1334228515625, -0.11828994750976562, -0.10315704345703125, -0.08802413940429688, -0.0728912353515625, -0.057758331298828125, -0.04262542724609375, -0.027492523193359375, -0.012359619140625, 0.002773284912109375, 0.01790618896484375, 0.033039093017578125, 0.0481719970703125, 0.06330490112304688, 0.07843780517578125, 0.09357070922851562, 0.10870361328125, 0.12383651733398438, 0.13896942138671875, 0.15410232543945312, 0.1692352294921875, 0.18436813354492188, 0.19950103759765625, 0.21463394165039062, 0.229766845703125, 0.24489974975585938, 0.26003265380859375, 0.2751655578613281, 0.2902984619140625, 0.3054313659667969, 0.32056427001953125, 0.3356971740722656, 0.350830078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 10.0, 20.0, 19.0, 28.0, 31.0, 57.0, 61.0, 65.0, 85.0, 89.0, 84.0, 97.0, 66.0, 47.0, 54.0, 49.0, 26.0, 27.0, 17.0, 16.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.18270111083984375, -0.1759490966796875, -0.16919708251953125, -0.162445068359375, -0.15569305419921875, -0.1489410400390625, -0.14218902587890625, -0.13543701171875, -0.12868499755859375, -0.1219329833984375, -0.11518096923828125, -0.108428955078125, -0.10167694091796875, -0.0949249267578125, -0.08817291259765625, -0.0814208984375, -0.07466888427734375, -0.0679168701171875, -0.06116485595703125, -0.054412841796875, -0.04766082763671875, -0.0409088134765625, -0.03415679931640625, -0.02740478515625, -0.02065277099609375, -0.0139007568359375, -0.00714874267578125, -0.000396728515625, 0.00635528564453125, 0.0131072998046875, 0.01985931396484375, 0.026611328125, 0.03336334228515625, 0.0401153564453125, 0.04686737060546875, 0.053619384765625, 0.06037139892578125, 0.0671234130859375, 0.07387542724609375, 0.08062744140625, 0.08737945556640625, 0.0941314697265625, 0.10088348388671875, 0.107635498046875, 0.11438751220703125, 0.1211395263671875, 0.12789154052734375, 0.1346435546875, 0.14139556884765625, 0.1481475830078125, 0.15489959716796875, 0.161651611328125, 0.16840362548828125, 0.1751556396484375, 0.18190765380859375, 0.18865966796875, 0.19541168212890625, 0.2021636962890625, 0.20891571044921875, 0.215667724609375, 0.22241973876953125, 0.2291717529296875, 0.23592376708984375, 0.24267578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 11.0, 15.0, 20.0, 38.0, 50.0, 74.0, 126.0, 142.0, 278.0, 478.0, 899.0, 1875.0, 4630.0, 15585.0, 105456.0, 3853984.0, 179843.0, 20549.0, 5602.0, 2224.0, 996.0, 536.0, 291.0, 177.0, 127.0, 85.0, 48.0, 42.0, 24.0, 19.0, 11.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3851165771484375, -0.372528076171875, -0.3599395751953125, -0.34735107421875, -0.3347625732421875, -0.322174072265625, -0.3095855712890625, -0.2969970703125, -0.2844085693359375, -0.271820068359375, -0.2592315673828125, -0.24664306640625, -0.2340545654296875, -0.221466064453125, -0.2088775634765625, -0.1962890625, -0.1837005615234375, -0.171112060546875, -0.1585235595703125, -0.14593505859375, -0.1333465576171875, -0.120758056640625, -0.1081695556640625, -0.0955810546875, -0.0829925537109375, -0.070404052734375, -0.0578155517578125, -0.04522705078125, -0.0326385498046875, -0.020050048828125, -0.0074615478515625, 0.005126953125, 0.0177154541015625, 0.030303955078125, 0.0428924560546875, 0.05548095703125, 0.0680694580078125, 0.080657958984375, 0.0932464599609375, 0.1058349609375, 0.1184234619140625, 0.131011962890625, 0.1436004638671875, 0.15618896484375, 0.1687774658203125, 0.181365966796875, 0.1939544677734375, 0.20654296875, 0.2191314697265625, 0.231719970703125, 0.2443084716796875, 0.25689697265625, 0.2694854736328125, 0.282073974609375, 0.2946624755859375, 0.3072509765625, 0.3198394775390625, 0.332427978515625, 0.3450164794921875, 0.35760498046875, 0.3701934814453125, 0.382781982421875, 0.3953704833984375, 0.407958984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 12.0, 15.0, 21.0, 49.0, 135.0, 489.0, 2912.0, 253.0, 96.0, 32.0, 21.0, 15.0, 6.0, 5.0, 0.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.1563262939453125, -0.151641845703125, -0.1469573974609375, -0.14227294921875, -0.1375885009765625, -0.132904052734375, -0.1282196044921875, -0.12353515625, -0.1188507080078125, -0.114166259765625, -0.1094818115234375, -0.10479736328125, -0.1001129150390625, -0.095428466796875, -0.0907440185546875, -0.0860595703125, -0.0813751220703125, -0.076690673828125, -0.0720062255859375, -0.06732177734375, -0.0626373291015625, -0.057952880859375, -0.0532684326171875, -0.048583984375, -0.0438995361328125, -0.039215087890625, -0.0345306396484375, -0.02984619140625, -0.0251617431640625, -0.020477294921875, -0.0157928466796875, -0.0111083984375, -0.0064239501953125, -0.001739501953125, 0.0029449462890625, 0.00762939453125, 0.0123138427734375, 0.016998291015625, 0.0216827392578125, 0.0263671875, 0.0310516357421875, 0.035736083984375, 0.0404205322265625, 0.04510498046875, 0.0497894287109375, 0.054473876953125, 0.0591583251953125, 0.0638427734375, 0.0685272216796875, 0.073211669921875, 0.0778961181640625, 0.08258056640625, 0.0872650146484375, 0.091949462890625, 0.0966339111328125, 0.101318359375, 0.1060028076171875, 0.110687255859375, 0.1153717041015625, 0.12005615234375, 0.1247406005859375, 0.129425048828125, 0.1341094970703125, 0.1387939453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 18.0, 29.0, 64.0, 105.0, 148.0, 196.0, 170.0, 137.0, 71.0, 44.0, 12.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.9417344331741333, -0.923327624797821, -0.9049208164215088, -0.8865140676498413, -0.868107259273529, -0.8497004508972168, -0.8312937021255493, -0.8128868937492371, -0.7944800853729248, -0.7760732769966125, -0.7576664686203003, -0.7392597198486328, -0.7208529114723206, -0.7024461030960083, -0.6840393543243408, -0.6656325459480286, -0.6472257375717163, -0.628818929195404, -0.6104121208190918, -0.5920053720474243, -0.5735985636711121, -0.5551917552947998, -0.5367850065231323, -0.5183781981468201, -0.4999713897705078, -0.48156458139419556, -0.4631578028202057, -0.4447510242462158, -0.42634421586990356, -0.4079374074935913, -0.38953062891960144, -0.3711238503456116, -0.3527171015739441, -0.33431029319763184, -0.31590351462364197, -0.2974967360496521, -0.27908992767333984, -0.2606831192970276, -0.24227634072303772, -0.22386954724788666, -0.2054627537727356, -0.18705596029758453, -0.16864916682243347, -0.1502423733472824, -0.13183557987213135, -0.11342878639698029, -0.09502199292182922, -0.07661519944667816, -0.0582084059715271, -0.03980161249637604, -0.021394819021224976, -0.0029880255460739136, 0.015418767929077148, 0.03382556140422821, 0.05223235487937927, 0.07063914835453033, 0.0890459418296814, 0.10745273530483246, 0.12585952877998352, 0.14426632225513458, 0.16267311573028564, 0.1810799092054367, 0.19948670268058777, 0.21789349615573883, 0.2363002896308899]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 8.0, 8.0, 17.0, 12.0, 11.0, 10.0, 20.0, 18.0, 20.0, 24.0, 32.0, 27.0, 41.0, 43.0, 34.0, 37.0, 47.0, 51.0, 35.0, 44.0, 47.0, 46.0, 37.0, 41.0, 27.0, 25.0, 35.0, 32.0, 19.0, 26.0, 25.0, 20.0, 19.0, 11.0, 16.0, 7.0, 4.0, 9.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.23878049850463867, -0.2317516803741455, -0.22472284734249115, -0.2176940143108368, -0.21066519618034363, -0.20363637804985046, -0.1966075450181961, -0.18957871198654175, -0.18254989385604858, -0.17552107572555542, -0.16849224269390106, -0.1614634096622467, -0.15443459153175354, -0.14740577340126038, -0.14037694036960602, -0.13334810733795166, -0.1263192892074585, -0.11929046362638474, -0.11226163804531097, -0.10523281246423721, -0.09820398688316345, -0.09117516130208969, -0.08414633572101593, -0.07711751013994217, -0.07008868455886841, -0.06305985897779465, -0.056031033396720886, -0.049002207815647125, -0.041973382234573364, -0.0349445566534996, -0.027915731072425842, -0.02088690549135208, -0.01385807991027832, -0.006829254329204559, 0.00019957125186920166, 0.007228396832942963, 0.014257222414016724, 0.021286047995090485, 0.028314873576164246, 0.03534369915723801, 0.04237252473831177, 0.04940135031938553, 0.05643017590045929, 0.06345900148153305, 0.07048782706260681, 0.07751665264368057, 0.08454547822475433, 0.0915743038058281, 0.09860312938690186, 0.10563195496797562, 0.11266078054904938, 0.11968960613012314, 0.1267184317111969, 0.13374724984169006, 0.14077608287334442, 0.14780491590499878, 0.15483373403549194, 0.1618625521659851, 0.16889138519763947, 0.17592021822929382, 0.182949036359787, 0.18997785449028015, 0.1970066875219345, 0.20403552055358887, 0.21106433868408203]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 17.0, 17.0, 27.0, 36.0, 101.0, 139.0, 281.0, 544.0, 1100.0, 3105.0, 9596.0, 39409.0, 204935.0, 538578.0, 197740.0, 38295.0, 9313.0, 2995.0, 1163.0, 520.0, 269.0, 144.0, 85.0, 55.0, 26.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41015625, -0.3992156982421875, -0.388275146484375, -0.3773345947265625, -0.36639404296875, -0.3554534912109375, -0.344512939453125, -0.3335723876953125, -0.3226318359375, -0.3116912841796875, -0.300750732421875, -0.2898101806640625, -0.27886962890625, -0.2679290771484375, -0.256988525390625, -0.2460479736328125, -0.235107421875, -0.2241668701171875, -0.213226318359375, -0.2022857666015625, -0.19134521484375, -0.1804046630859375, -0.169464111328125, -0.1585235595703125, -0.1475830078125, -0.1366424560546875, -0.125701904296875, -0.1147613525390625, -0.10382080078125, -0.0928802490234375, -0.081939697265625, -0.0709991455078125, -0.06005859375, -0.0491180419921875, -0.038177490234375, -0.0272369384765625, -0.01629638671875, -0.0053558349609375, 0.005584716796875, 0.0165252685546875, 0.0274658203125, 0.0384063720703125, 0.049346923828125, 0.0602874755859375, 0.07122802734375, 0.0821685791015625, 0.093109130859375, 0.1040496826171875, 0.114990234375, 0.1259307861328125, 0.136871337890625, 0.1478118896484375, 0.15875244140625, 0.1696929931640625, 0.180633544921875, 0.1915740966796875, 0.2025146484375, 0.2134552001953125, 0.224395751953125, 0.2353363037109375, 0.24627685546875, 0.2572174072265625, 0.268157958984375, 0.2790985107421875, 0.2900390625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 8.0, 9.0, 18.0, 19.0, 18.0, 20.0, 37.0, 39.0, 62.0, 66.0, 66.0, 72.0, 83.0, 94.0, 78.0, 58.0, 53.0, 41.0, 39.0, 42.0, 17.0, 18.0, 10.0, 6.0, 6.0, 8.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18257522583007812, -0.17618560791015625, -0.16979598999023438, -0.1634063720703125, -0.15701675415039062, -0.15062713623046875, -0.14423751831054688, -0.137847900390625, -0.13145828247070312, -0.12506866455078125, -0.11867904663085938, -0.1122894287109375, -0.10589981079101562, -0.09951019287109375, -0.09312057495117188, -0.08673095703125, -0.08034133911132812, -0.07395172119140625, -0.06756210327148438, -0.0611724853515625, -0.054782867431640625, -0.04839324951171875, -0.042003631591796875, -0.035614013671875, -0.029224395751953125, -0.02283477783203125, -0.016445159912109375, -0.0100555419921875, -0.003665924072265625, 0.00272369384765625, 0.009113311767578125, 0.0155029296875, 0.021892547607421875, 0.02828216552734375, 0.034671783447265625, 0.0410614013671875, 0.047451019287109375, 0.05384063720703125, 0.060230255126953125, 0.066619873046875, 0.07300949096679688, 0.07939910888671875, 0.08578872680664062, 0.0921783447265625, 0.09856796264648438, 0.10495758056640625, 0.11134719848632812, 0.11773681640625, 0.12412643432617188, 0.13051605224609375, 0.13690567016601562, 0.1432952880859375, 0.14968490600585938, 0.15607452392578125, 0.16246414184570312, 0.168853759765625, 0.17524337768554688, 0.18163299560546875, 0.18802261352539062, 0.1944122314453125, 0.20080184936523438, 0.20719146728515625, 0.21358108520507812, 0.219970703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 8.0, 5.0, 5.0, 6.0, 13.0, 9.0, 19.0, 37.0, 60.0, 90.0, 179.0, 491.0, 1630.0, 10121.0, 322327.0, 693195.0, 17001.0, 2233.0, 592.0, 238.0, 104.0, 67.0, 38.0, 23.0, 11.0, 12.0, 2.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6201171875, -0.594390869140625, -0.56866455078125, -0.542938232421875, -0.5172119140625, -0.491485595703125, -0.46575927734375, -0.440032958984375, -0.414306640625, -0.388580322265625, -0.36285400390625, -0.337127685546875, -0.3114013671875, -0.285675048828125, -0.25994873046875, -0.234222412109375, -0.20849609375, -0.182769775390625, -0.15704345703125, -0.131317138671875, -0.1055908203125, -0.079864501953125, -0.05413818359375, -0.028411865234375, -0.002685546875, 0.023040771484375, 0.04876708984375, 0.074493408203125, 0.1002197265625, 0.125946044921875, 0.15167236328125, 0.177398681640625, 0.203125, 0.228851318359375, 0.25457763671875, 0.280303955078125, 0.3060302734375, 0.331756591796875, 0.35748291015625, 0.383209228515625, 0.408935546875, 0.434661865234375, 0.46038818359375, 0.486114501953125, 0.5118408203125, 0.537567138671875, 0.56329345703125, 0.589019775390625, 0.61474609375, 0.640472412109375, 0.66619873046875, 0.691925048828125, 0.7176513671875, 0.743377685546875, 0.76910400390625, 0.794830322265625, 0.820556640625, 0.846282958984375, 0.87200927734375, 0.897735595703125, 0.9234619140625, 0.949188232421875, 0.97491455078125, 1.000640869140625, 1.0263671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 9.0, 4.0, 4.0, 5.0, 8.0, 10.0, 11.0, 13.0, 14.0, 17.0, 24.0, 38.0, 30.0, 40.0, 33.0, 51.0, 60.0, 62.0, 54.0, 56.0, 52.0, 78.0, 59.0, 42.0, 35.0, 28.0, 28.0, 21.0, 24.0, 14.0, 9.0, 13.0, 8.0, 6.0, 4.0, 5.0, 2.0, 7.0, 6.0, 0.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.68896484375, -0.6676483154296875, -0.646331787109375, -0.6250152587890625, -0.60369873046875, -0.5823822021484375, -0.561065673828125, -0.5397491455078125, -0.5184326171875, -0.4971160888671875, -0.475799560546875, -0.4544830322265625, -0.43316650390625, -0.4118499755859375, -0.390533447265625, -0.3692169189453125, -0.347900390625, -0.3265838623046875, -0.305267333984375, -0.2839508056640625, -0.26263427734375, -0.2413177490234375, -0.220001220703125, -0.1986846923828125, -0.1773681640625, -0.1560516357421875, -0.134735107421875, -0.1134185791015625, -0.09210205078125, -0.0707855224609375, -0.049468994140625, -0.0281524658203125, -0.0068359375, 0.0144805908203125, 0.035797119140625, 0.0571136474609375, 0.07843017578125, 0.0997467041015625, 0.121063232421875, 0.1423797607421875, 0.1636962890625, 0.1850128173828125, 0.206329345703125, 0.2276458740234375, 0.24896240234375, 0.2702789306640625, 0.291595458984375, 0.3129119873046875, 0.334228515625, 0.3555450439453125, 0.376861572265625, 0.3981781005859375, 0.41949462890625, 0.4408111572265625, 0.462127685546875, 0.4834442138671875, 0.5047607421875, 0.5260772705078125, 0.547393798828125, 0.5687103271484375, 0.59002685546875, 0.6113433837890625, 0.632659912109375, 0.6539764404296875, 0.67529296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 20.0, 25.0, 35.0, 90.0, 178.0, 545.0, 2436.0, 53290.0, 969434.0, 20081.0, 1635.0, 416.0, 166.0, 70.0, 41.0, 32.0, 22.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6067543029785156, -0.5909500122070312, -0.5751457214355469, -0.5593414306640625, -0.5435371398925781, -0.5277328491210938, -0.5119285583496094, -0.496124267578125, -0.4803199768066406, -0.46451568603515625, -0.4487113952636719, -0.4329071044921875, -0.4171028137207031, -0.40129852294921875, -0.3854942321777344, -0.36968994140625, -0.3538856506347656, -0.33808135986328125, -0.3222770690917969, -0.3064727783203125, -0.2906684875488281, -0.27486419677734375, -0.2590599060058594, -0.243255615234375, -0.22745132446289062, -0.21164703369140625, -0.19584274291992188, -0.1800384521484375, -0.16423416137695312, -0.14842987060546875, -0.13262557983398438, -0.1168212890625, -0.10101699829101562, -0.08521270751953125, -0.06940841674804688, -0.0536041259765625, -0.037799835205078125, -0.02199554443359375, -0.006191253662109375, 0.009613037109375, 0.025417327880859375, 0.04122161865234375, 0.057025909423828125, 0.0728302001953125, 0.08863449096679688, 0.10443878173828125, 0.12024307250976562, 0.13604736328125, 0.15185165405273438, 0.16765594482421875, 0.18346023559570312, 0.1992645263671875, 0.21506881713867188, 0.23087310791015625, 0.24667739868164062, 0.262481689453125, 0.2782859802246094, 0.29409027099609375, 0.3098945617675781, 0.3256988525390625, 0.3415031433105469, 0.35730743408203125, 0.3731117248535156, 0.388916015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 12.0, 22.0, 17.0, 32.0, 28.0, 53.0, 74.0, 78.0, 114.0, 131.0, 113.0, 72.0, 60.0, 61.0, 37.0, 31.0, 21.0, 15.0, 10.0, 11.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010263919830322266, -0.0001000305637717247, -9.742192924022675e-05, -9.481329470872879e-05, -9.220466017723083e-05, -8.959602564573288e-05, -8.698739111423492e-05, -8.437875658273697e-05, -8.177012205123901e-05, -7.916148751974106e-05, -7.65528529882431e-05, -7.394421845674515e-05, -7.133558392524719e-05, -6.872694939374924e-05, -6.611831486225128e-05, -6.350968033075333e-05, -6.090104579925537e-05, -5.8292411267757416e-05, -5.568377673625946e-05, -5.3075142204761505e-05, -5.046650767326355e-05, -4.7857873141765594e-05, -4.524923861026764e-05, -4.2640604078769684e-05, -4.003196954727173e-05, -3.742333501577377e-05, -3.481470048427582e-05, -3.220606595277786e-05, -2.9597431421279907e-05, -2.6988796889781952e-05, -2.4380162358283997e-05, -2.177152782678604e-05, -1.9162893295288086e-05, -1.655425876379013e-05, -1.3945624232292175e-05, -1.133698970079422e-05, -8.728355169296265e-06, -6.119720637798309e-06, -3.511086106300354e-06, -9.024515748023987e-07, 1.7061829566955566e-06, 4.314817488193512e-06, 6.923452019691467e-06, 9.532086551189423e-06, 1.2140721082687378e-05, 1.4749355614185333e-05, 1.735799014568329e-05, 1.9966624677181244e-05, 2.25752592086792e-05, 2.5183893740177155e-05, 2.779252827167511e-05, 3.0401162803173065e-05, 3.300979733467102e-05, 3.5618431866168976e-05, 3.822706639766693e-05, 4.0835700929164886e-05, 4.344433546066284e-05, 4.60529699921608e-05, 4.866160452365875e-05, 5.127023905515671e-05, 5.387887358665466e-05, 5.648750811815262e-05, 5.9096142649650574e-05, 6.170477718114853e-05, 6.431341171264648e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 12.0, 22.0, 30.0, 60.0, 122.0, 224.0, 490.0, 1569.0, 6826.0, 113582.0, 860452.0, 58036.0, 4946.0, 1293.0, 458.0, 192.0, 81.0, 55.0, 35.0, 13.0, 18.0, 8.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2864036560058594, -0.27666473388671875, -0.2669258117675781, -0.2571868896484375, -0.24744796752929688, -0.23770904541015625, -0.22797012329101562, -0.218231201171875, -0.20849227905273438, -0.19875335693359375, -0.18901443481445312, -0.1792755126953125, -0.16953659057617188, -0.15979766845703125, -0.15005874633789062, -0.14031982421875, -0.13058090209960938, -0.12084197998046875, -0.11110305786132812, -0.1013641357421875, -0.09162521362304688, -0.08188629150390625, -0.07214736938476562, -0.062408447265625, -0.052669525146484375, -0.04293060302734375, -0.033191680908203125, -0.0234527587890625, -0.013713836669921875, -0.00397491455078125, 0.005764007568359375, 0.0155029296875, 0.025241851806640625, 0.03498077392578125, 0.044719696044921875, 0.0544586181640625, 0.06419754028320312, 0.07393646240234375, 0.08367538452148438, 0.093414306640625, 0.10315322875976562, 0.11289215087890625, 0.12263107299804688, 0.1323699951171875, 0.14210891723632812, 0.15184783935546875, 0.16158676147460938, 0.17132568359375, 0.18106460571289062, 0.19080352783203125, 0.20054244995117188, 0.2102813720703125, 0.22002029418945312, 0.22975921630859375, 0.23949813842773438, 0.249237060546875, 0.2589759826660156, 0.26871490478515625, 0.2784538269042969, 0.2881927490234375, 0.2979316711425781, 0.30767059326171875, 0.3174095153808594, 0.3271484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 7.0, 1.0, 4.0, 10.0, 11.0, 24.0, 36.0, 52.0, 73.0, 93.0, 116.0, 121.0, 118.0, 92.0, 77.0, 63.0, 35.0, 20.0, 21.0, 4.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.23842430114746094, -0.23014450073242188, -0.2218647003173828, -0.21358489990234375, -0.2053050994873047, -0.19702529907226562, -0.18874549865722656, -0.1804656982421875, -0.17218589782714844, -0.16390609741210938, -0.1556262969970703, -0.14734649658203125, -0.1390666961669922, -0.13078689575195312, -0.12250709533691406, -0.114227294921875, -0.10594749450683594, -0.09766769409179688, -0.08938789367675781, -0.08110809326171875, -0.07282829284667969, -0.06454849243164062, -0.05626869201660156, -0.0479888916015625, -0.03970909118652344, -0.031429290771484375, -0.023149490356445312, -0.01486968994140625, -0.0065898895263671875, 0.001689910888671875, 0.009969711303710938, 0.01824951171875, 0.026529312133789062, 0.034809112548828125, 0.04308891296386719, 0.05136871337890625, 0.05964851379394531, 0.06792831420898438, 0.07620811462402344, 0.0844879150390625, 0.09276771545410156, 0.10104751586914062, 0.10932731628417969, 0.11760711669921875, 0.1258869171142578, 0.13416671752929688, 0.14244651794433594, 0.150726318359375, 0.15900611877441406, 0.16728591918945312, 0.1755657196044922, 0.18384552001953125, 0.1921253204345703, 0.20040512084960938, 0.20868492126464844, 0.2169647216796875, 0.22524452209472656, 0.23352432250976562, 0.2418041229248047, 0.25008392333984375, 0.2583637237548828, 0.2666435241699219, 0.27492332458496094, 0.283203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 11.0, 14.0, 30.0, 47.0, 82.0, 119.0, 170.0, 174.0, 139.0, 93.0, 60.0, 25.0, 13.0, 13.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.522227764129639, -5.412898540496826, -5.3035688400268555, -5.194239616394043, -5.084909915924072, -4.97558069229126, -4.866250991821289, -4.756921768188477, -4.647592544555664, -4.538263320922852, -4.428933620452881, -4.319604396820068, -4.210274696350098, -4.100945472717285, -3.9916160106658936, -3.882286548614502, -3.7729570865631104, -3.6636276245117188, -3.554298162460327, -3.4449687004089355, -3.335639476776123, -3.2263100147247314, -3.11698055267334, -3.0076510906219482, -2.8983216285705566, -2.788992166519165, -2.6796627044677734, -2.570333480834961, -2.4610040187835693, -2.3516745567321777, -2.242345094680786, -2.1330156326293945, -2.023686170578003, -1.9143567085266113, -1.8050273656845093, -1.6956979036331177, -1.5863685607910156, -1.477039098739624, -1.3677096366882324, -1.2583801746368408, -1.1490508317947388, -1.0397213697433472, -0.9303920269012451, -0.8210625648498535, -0.7117331624031067, -0.6024037599563599, -0.49307429790496826, -0.38374489545822144, -0.2744154930114746, -0.1650860756635666, -0.05575665831565857, 0.053572773933410645, 0.16290217638015747, 0.2722315788269043, 0.3815610408782959, 0.4908904433250427, 0.6002198457717896, 0.7095492482185364, 0.8188786506652832, 0.9282081127166748, 1.0375375747680664, 1.1468669176101685, 1.25619637966156, 1.365525722503662, 1.4748551845550537]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 6.0, 15.0, 12.0, 13.0, 19.0, 15.0, 26.0, 29.0, 34.0, 40.0, 38.0, 51.0, 43.0, 59.0, 50.0, 54.0, 52.0, 48.0, 50.0, 42.0, 37.0, 36.0, 42.0, 36.0, 28.0, 23.0, 16.0, 10.0, 8.0, 8.0, 10.0, 8.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5343985557556152, -2.4423270225524902, -2.3502554893493652, -2.2581839561462402, -2.1661124229431152, -2.0740408897399902, -1.9819693565368652, -1.8898978233337402, -1.7978262901306152, -1.7057547569274902, -1.6136832237243652, -1.5216116905212402, -1.4295401573181152, -1.3374686241149902, -1.2453970909118652, -1.1533255577087402, -1.0612541437149048, -0.9691826105117798, -0.8771110773086548, -0.7850395441055298, -0.6929680109024048, -0.6008964776992798, -0.5088250041007996, -0.41675347089767456, -0.32468193769454956, -0.23261040449142456, -0.14053888618946075, -0.04846736788749695, 0.04360416531562805, 0.13567569851875305, 0.22774720191955566, 0.31981873512268066, 0.41189026832580566, 0.5039618015289307, 0.5960333347320557, 0.6881048679351807, 0.7801764011383057, 0.8722479343414307, 0.9643194079399109, 1.0563910007476807, 1.1484625339508057, 1.2405340671539307, 1.3326056003570557, 1.4246771335601807, 1.5167486667633057, 1.6088201999664307, 1.7008917331695557, 1.7929632663726807, 1.8850346803665161, 1.9771062135696411, 2.0691776275634766, 2.1612491607666016, 2.2533206939697266, 2.3453922271728516, 2.4374637603759766, 2.5295352935791016, 2.6216068267822266, 2.7136783599853516, 2.8057498931884766, 2.8978214263916016, 2.9898929595947266, 3.0819644927978516, 3.1740360260009766, 3.2661075592041016, 3.3581790924072266]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 12.0, 9.0, 16.0, 32.0, 37.0, 83.0, 180.0, 337.0, 853.0, 3465.0, 30389.0, 4111215.0, 41693.0, 4079.0, 1059.0, 430.0, 177.0, 95.0, 43.0, 31.0, 19.0, 10.0, 7.0, 4.0, 9.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6277236938476562, -0.6040802001953125, -0.5804367065429688, -0.556793212890625, -0.5331497192382812, -0.5095062255859375, -0.48586273193359375, -0.46221923828125, -0.43857574462890625, -0.4149322509765625, -0.39128875732421875, -0.367645263671875, -0.34400177001953125, -0.3203582763671875, -0.29671478271484375, -0.2730712890625, -0.24942779541015625, -0.2257843017578125, -0.20214080810546875, -0.178497314453125, -0.15485382080078125, -0.1312103271484375, -0.10756683349609375, -0.08392333984375, -0.06027984619140625, -0.0366363525390625, -0.01299285888671875, 0.010650634765625, 0.03429412841796875, 0.0579376220703125, 0.08158111572265625, 0.105224609375, 0.12886810302734375, 0.1525115966796875, 0.17615509033203125, 0.199798583984375, 0.22344207763671875, 0.2470855712890625, 0.27072906494140625, 0.29437255859375, 0.31801605224609375, 0.3416595458984375, 0.36530303955078125, 0.388946533203125, 0.41259002685546875, 0.4362335205078125, 0.45987701416015625, 0.4835205078125, 0.5071640014648438, 0.5308074951171875, 0.5544509887695312, 0.578094482421875, 0.6017379760742188, 0.6253814697265625, 0.6490249633789062, 0.67266845703125, 0.6963119506835938, 0.7199554443359375, 0.7435989379882812, 0.767242431640625, 0.7908859252929688, 0.8145294189453125, 0.8381729125976562, 0.86181640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 17.0, 19.0, 28.0, 41.0, 64.0, 76.0, 83.0, 101.0, 105.0, 104.0, 77.0, 78.0, 55.0, 35.0, 34.0, 20.0, 15.0, 16.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17220115661621094, -0.16386032104492188, -0.1555194854736328, -0.14717864990234375, -0.1388378143310547, -0.13049697875976562, -0.12215614318847656, -0.1138153076171875, -0.10547447204589844, -0.09713363647460938, -0.08879280090332031, -0.08045196533203125, -0.07211112976074219, -0.06377029418945312, -0.05542945861816406, -0.047088623046875, -0.03874778747558594, -0.030406951904296875, -0.022066116333007812, -0.01372528076171875, -0.0053844451904296875, 0.002956390380859375, 0.011297225952148438, 0.0196380615234375, 0.027978897094726562, 0.036319732666015625, 0.04466056823730469, 0.05300140380859375, 0.06134223937988281, 0.06968307495117188, 0.07802391052246094, 0.08636474609375, 0.09470558166503906, 0.10304641723632812, 0.11138725280761719, 0.11972808837890625, 0.1280689239501953, 0.13640975952148438, 0.14475059509277344, 0.1530914306640625, 0.16143226623535156, 0.16977310180664062, 0.1781139373779297, 0.18645477294921875, 0.1947956085205078, 0.20313644409179688, 0.21147727966308594, 0.219818115234375, 0.22815895080566406, 0.23649978637695312, 0.2448406219482422, 0.25318145751953125, 0.2615222930908203, 0.2698631286621094, 0.27820396423339844, 0.2865447998046875, 0.29488563537597656, 0.3032264709472656, 0.3115673065185547, 0.31990814208984375, 0.3282489776611328, 0.3365898132324219, 0.34493064880371094, 0.353271484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 10.0, 14.0, 17.0, 41.0, 60.0, 118.0, 157.0, 276.0, 575.0, 948.0, 1875.0, 4273.0, 13271.0, 78377.0, 3869207.0, 192579.0, 21374.0, 5918.0, 2431.0, 1189.0, 671.0, 395.0, 208.0, 130.0, 69.0, 38.0, 16.0, 16.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20318031311035156, -0.19334793090820312, -0.1835155487060547, -0.17368316650390625, -0.1638507843017578, -0.15401840209960938, -0.14418601989746094, -0.1343536376953125, -0.12452125549316406, -0.11468887329101562, -0.10485649108886719, -0.09502410888671875, -0.08519172668457031, -0.07535934448242188, -0.06552696228027344, -0.055694580078125, -0.04586219787597656, -0.036029815673828125, -0.026197433471679688, -0.01636505126953125, -0.0065326690673828125, 0.003299713134765625, 0.013132095336914062, 0.0229644775390625, 0.03279685974121094, 0.042629241943359375, 0.05246162414550781, 0.06229400634765625, 0.07212638854980469, 0.08195877075195312, 0.09179115295410156, 0.10162353515625, 0.11145591735839844, 0.12128829956054688, 0.1311206817626953, 0.14095306396484375, 0.1507854461669922, 0.16061782836914062, 0.17045021057128906, 0.1802825927734375, 0.19011497497558594, 0.19994735717773438, 0.2097797393798828, 0.21961212158203125, 0.2294445037841797, 0.23927688598632812, 0.24910926818847656, 0.258941650390625, 0.26877403259277344, 0.2786064147949219, 0.2884387969970703, 0.29827117919921875, 0.3081035614013672, 0.3179359436035156, 0.32776832580566406, 0.3376007080078125, 0.34743309020996094, 0.3572654724121094, 0.3670978546142578, 0.37693023681640625, 0.3867626190185547, 0.3965950012207031, 0.40642738342285156, 0.416259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 15.0, 34.0, 53.0, 130.0, 435.0, 2986.0, 239.0, 75.0, 41.0, 23.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07293701171875, -0.06980037689208984, -0.06666374206542969, -0.06352710723876953, -0.060390472412109375, -0.05725383758544922, -0.05411720275878906, -0.050980567932128906, -0.04784393310546875, -0.044707298278808594, -0.04157066345214844, -0.03843402862548828, -0.035297393798828125, -0.03216075897216797, -0.029024124145507812, -0.025887489318847656, -0.0227508544921875, -0.019614219665527344, -0.016477584838867188, -0.013340950012207031, -0.010204315185546875, -0.007067680358886719, -0.0039310455322265625, -0.0007944107055664062, 0.00234222412109375, 0.005478858947753906, 0.008615493774414062, 0.011752128601074219, 0.014888763427734375, 0.01802539825439453, 0.021162033081054688, 0.024298667907714844, 0.027435302734375, 0.030571937561035156, 0.03370857238769531, 0.03684520721435547, 0.039981842041015625, 0.04311847686767578, 0.04625511169433594, 0.049391746520996094, 0.05252838134765625, 0.055665016174316406, 0.05880165100097656, 0.06193828582763672, 0.06507492065429688, 0.06821155548095703, 0.07134819030761719, 0.07448482513427734, 0.0776214599609375, 0.08075809478759766, 0.08389472961425781, 0.08703136444091797, 0.09016799926757812, 0.09330463409423828, 0.09644126892089844, 0.0995779037475586, 0.10271453857421875, 0.1058511734008789, 0.10898780822753906, 0.11212444305419922, 0.11526107788085938, 0.11839771270751953, 0.12153434753417969, 0.12467098236083984, 0.1278076171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 9.0, 6.0, 22.0, 26.0, 39.0, 73.0, 92.0, 112.0, 117.0, 96.0, 111.0, 89.0, 61.0, 48.0, 39.0, 19.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.27748343348503113, -0.269666463136673, -0.2618495225906372, -0.25403255224227905, -0.2462155818939209, -0.23839862644672394, -0.23058167099952698, -0.22276470065116882, -0.21494773030281067, -0.2071307748556137, -0.19931380450725555, -0.1914968490600586, -0.18367987871170044, -0.17586292326450348, -0.16804596781730652, -0.16022899746894836, -0.1524120420217514, -0.14459508657455444, -0.1367781162261963, -0.12896116077899933, -0.12114419043064117, -0.11332723498344421, -0.10551027208566666, -0.0976933091878891, -0.08987634629011154, -0.08205938339233398, -0.07424242049455643, -0.06642545759677887, -0.05860849842429161, -0.05079153552651405, -0.042974576354026794, -0.03515761345624924, -0.027340665459632874, -0.019523702561855316, -0.011706741526722908, -0.0038897804915905, 0.0039271824061870575, 0.011744145303964615, 0.019561104476451874, 0.02737806737422943, 0.03519503027200699, 0.043011993169784546, 0.0508289560675621, 0.05864591524004936, 0.06646287441253662, 0.07427984476089478, 0.08209680020809174, 0.0899137631058693, 0.09773072600364685, 0.10554768890142441, 0.11336465179920197, 0.12118160724639893, 0.12899857759475708, 0.13681553304195404, 0.144632488489151, 0.15244945883750916, 0.1602664291858673, 0.16808338463306427, 0.17590035498142242, 0.18371731042861938, 0.19153428077697754, 0.1993512362241745, 0.20716819167137146, 0.21498516201972961, 0.22280211746692657]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 7.0, 4.0, 8.0, 14.0, 12.0, 19.0, 25.0, 22.0, 24.0, 27.0, 38.0, 37.0, 50.0, 47.0, 36.0, 49.0, 50.0, 54.0, 41.0, 49.0, 56.0, 41.0, 44.0, 47.0, 29.0, 30.0, 32.0, 18.0, 25.0, 12.0, 8.0, 6.0, 8.0, 3.0, 8.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.18881118297576904, -0.1834801435470581, -0.17814911901950836, -0.17281809449195862, -0.16748705506324768, -0.16215601563453674, -0.156824991106987, -0.15149396657943726, -0.14616292715072632, -0.14083188772201538, -0.13550086319446564, -0.1301698386669159, -0.12483879923820496, -0.11950776726007462, -0.11417673528194427, -0.10884570330381393, -0.1035146713256836, -0.09818363934755325, -0.09285260736942291, -0.08752157539129257, -0.08219054341316223, -0.07685951143503189, -0.07152847945690155, -0.06619744747877121, -0.06086641550064087, -0.05553538352251053, -0.05020435154438019, -0.04487331956624985, -0.03954228758811951, -0.034211255609989166, -0.028880223631858826, -0.023549191653728485, -0.018218159675598145, -0.012887127697467804, -0.007556095719337463, -0.002225063741207123, 0.0031059682369232178, 0.008437000215053558, 0.013768032193183899, 0.01909906417131424, 0.02443009614944458, 0.02976112812757492, 0.03509216010570526, 0.0404231920838356, 0.04575422406196594, 0.05108525604009628, 0.056416288018226624, 0.061747319996356964, 0.0670783519744873, 0.07240938395261765, 0.07774041593074799, 0.08307144790887833, 0.08840247988700867, 0.09373351186513901, 0.09906454384326935, 0.10439557582139969, 0.10972660779953003, 0.11505763977766037, 0.12038867175579071, 0.12571969628334045, 0.1310507357120514, 0.13638177514076233, 0.14171279966831207, 0.14704382419586182, 0.15237486362457275]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 14.0, 11.0, 22.0, 38.0, 56.0, 98.0, 203.0, 511.0, 1495.0, 7078.0, 72822.0, 755439.0, 193431.0, 13774.0, 2312.0, 679.0, 270.0, 127.0, 72.0, 36.0, 19.0, 11.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.351806640625, -0.3355674743652344, -0.31932830810546875, -0.3030891418457031, -0.2868499755859375, -0.2706108093261719, -0.25437164306640625, -0.23813247680664062, -0.221893310546875, -0.20565414428710938, -0.18941497802734375, -0.17317581176757812, -0.1569366455078125, -0.14069747924804688, -0.12445831298828125, -0.10821914672851562, -0.09197998046875, -0.07574081420898438, -0.05950164794921875, -0.043262481689453125, -0.0270233154296875, -0.010784149169921875, 0.00545501708984375, 0.021694183349609375, 0.037933349609375, 0.054172515869140625, 0.07041168212890625, 0.08665084838867188, 0.1028900146484375, 0.11912918090820312, 0.13536834716796875, 0.15160751342773438, 0.1678466796875, 0.18408584594726562, 0.20032501220703125, 0.21656417846679688, 0.2328033447265625, 0.24904251098632812, 0.26528167724609375, 0.2815208435058594, 0.297760009765625, 0.3139991760253906, 0.33023834228515625, 0.3464775085449219, 0.3627166748046875, 0.3789558410644531, 0.39519500732421875, 0.4114341735839844, 0.42767333984375, 0.4439125061035156, 0.46015167236328125, 0.4763908386230469, 0.4926300048828125, 0.5088691711425781, 0.5251083374023438, 0.5413475036621094, 0.557586669921875, 0.5738258361816406, 0.5900650024414062, 0.6063041687011719, 0.6225433349609375, 0.6387825012207031, 0.6550216674804688, 0.6712608337402344, 0.6875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 10.0, 16.0, 23.0, 28.0, 48.0, 66.0, 105.0, 96.0, 89.0, 95.0, 106.0, 68.0, 79.0, 50.0, 28.0, 29.0, 17.0, 11.0, 11.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17658424377441406, -0.16823196411132812, -0.1598796844482422, -0.15152740478515625, -0.1431751251220703, -0.13482284545898438, -0.12647056579589844, -0.1181182861328125, -0.10976600646972656, -0.10141372680664062, -0.09306144714355469, -0.08470916748046875, -0.07635688781738281, -0.06800460815429688, -0.05965232849121094, -0.051300048828125, -0.04294776916503906, -0.034595489501953125, -0.026243209838867188, -0.01789093017578125, -0.009538650512695312, -0.001186370849609375, 0.0071659088134765625, 0.0155181884765625, 0.023870468139648438, 0.032222747802734375, 0.04057502746582031, 0.04892730712890625, 0.05727958679199219, 0.06563186645507812, 0.07398414611816406, 0.08233642578125, 0.09068870544433594, 0.09904098510742188, 0.10739326477050781, 0.11574554443359375, 0.12409782409667969, 0.13245010375976562, 0.14080238342285156, 0.1491546630859375, 0.15750694274902344, 0.16585922241210938, 0.1742115020751953, 0.18256378173828125, 0.1909160614013672, 0.19926834106445312, 0.20762062072753906, 0.215972900390625, 0.22432518005371094, 0.23267745971679688, 0.2410297393798828, 0.24938201904296875, 0.2577342987060547, 0.2660865783691406, 0.27443885803222656, 0.2827911376953125, 0.29114341735839844, 0.2994956970214844, 0.3078479766845703, 0.31620025634765625, 0.3245525360107422, 0.3329048156738281, 0.34125709533691406, 0.349609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 14.0, 17.0, 29.0, 24.0, 26.0, 42.0, 75.0, 128.0, 227.0, 532.0, 1482.0, 8501.0, 361539.0, 659902.0, 12716.0, 1931.0, 696.0, 242.0, 131.0, 76.0, 62.0, 42.0, 23.0, 20.0, 15.0, 13.0, 7.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6990814208984375, -0.677947998046875, -0.6568145751953125, -0.63568115234375, -0.6145477294921875, -0.593414306640625, -0.5722808837890625, -0.5511474609375, -0.5300140380859375, -0.508880615234375, -0.4877471923828125, -0.46661376953125, -0.4454803466796875, -0.424346923828125, -0.4032135009765625, -0.382080078125, -0.3609466552734375, -0.339813232421875, -0.3186798095703125, -0.29754638671875, -0.2764129638671875, -0.255279541015625, -0.2341461181640625, -0.2130126953125, -0.1918792724609375, -0.170745849609375, -0.1496124267578125, -0.12847900390625, -0.1073455810546875, -0.086212158203125, -0.0650787353515625, -0.0439453125, -0.0228118896484375, -0.001678466796875, 0.0194549560546875, 0.04058837890625, 0.0617218017578125, 0.082855224609375, 0.1039886474609375, 0.1251220703125, 0.1462554931640625, 0.167388916015625, 0.1885223388671875, 0.20965576171875, 0.2307891845703125, 0.251922607421875, 0.2730560302734375, 0.294189453125, 0.3153228759765625, 0.336456298828125, 0.3575897216796875, 0.37872314453125, 0.3998565673828125, 0.420989990234375, 0.4421234130859375, 0.4632568359375, 0.4843902587890625, 0.505523681640625, 0.5266571044921875, 0.54779052734375, 0.5689239501953125, 0.590057373046875, 0.6111907958984375, 0.63232421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 10.0, 10.0, 10.0, 19.0, 14.0, 26.0, 26.0, 21.0, 49.0, 35.0, 35.0, 40.0, 45.0, 44.0, 55.0, 41.0, 47.0, 58.0, 50.0, 33.0, 33.0, 41.0, 32.0, 39.0, 25.0, 26.0, 24.0, 22.0, 13.0, 15.0, 10.0, 10.0, 4.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.65625, -0.6384353637695312, -0.6206207275390625, -0.6028060913085938, -0.584991455078125, -0.5671768188476562, -0.5493621826171875, -0.5315475463867188, -0.51373291015625, -0.49591827392578125, -0.4781036376953125, -0.46028900146484375, -0.442474365234375, -0.42465972900390625, -0.4068450927734375, -0.38903045654296875, -0.3712158203125, -0.35340118408203125, -0.3355865478515625, -0.31777191162109375, -0.299957275390625, -0.28214263916015625, -0.2643280029296875, -0.24651336669921875, -0.22869873046875, -0.21088409423828125, -0.1930694580078125, -0.17525482177734375, -0.157440185546875, -0.13962554931640625, -0.1218109130859375, -0.10399627685546875, -0.086181640625, -0.06836700439453125, -0.0505523681640625, -0.03273773193359375, -0.014923095703125, 0.00289154052734375, 0.0207061767578125, 0.03852081298828125, 0.05633544921875, 0.07415008544921875, 0.0919647216796875, 0.10977935791015625, 0.127593994140625, 0.14540863037109375, 0.1632232666015625, 0.18103790283203125, 0.1988525390625, 0.21666717529296875, 0.2344818115234375, 0.25229644775390625, 0.270111083984375, 0.28792572021484375, 0.3057403564453125, 0.32355499267578125, 0.34136962890625, 0.35918426513671875, 0.3769989013671875, 0.39481353759765625, 0.412628173828125, 0.43044281005859375, 0.4482574462890625, 0.46607208251953125, 0.48388671875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 18.0, 31.0, 87.0, 423.0, 3973.0, 1011478.0, 31275.0, 957.0, 195.0, 54.0, 26.0, 13.0, 7.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.7696304321289062, -0.7492218017578125, -0.7288131713867188, -0.708404541015625, -0.6879959106445312, -0.6675872802734375, -0.6471786499023438, -0.62677001953125, -0.6063613891601562, -0.5859527587890625, -0.5655441284179688, -0.545135498046875, -0.5247268676757812, -0.5043182373046875, -0.48390960693359375, -0.4635009765625, -0.44309234619140625, -0.4226837158203125, -0.40227508544921875, -0.381866455078125, -0.36145782470703125, -0.3410491943359375, -0.32064056396484375, -0.30023193359375, -0.27982330322265625, -0.2594146728515625, -0.23900604248046875, -0.218597412109375, -0.19818878173828125, -0.1777801513671875, -0.15737152099609375, -0.136962890625, -0.11655426025390625, -0.0961456298828125, -0.07573699951171875, -0.055328369140625, -0.03491973876953125, -0.0145111083984375, 0.00589752197265625, 0.02630615234375, 0.04671478271484375, 0.0671234130859375, 0.08753204345703125, 0.107940673828125, 0.12834930419921875, 0.1487579345703125, 0.16916656494140625, 0.1895751953125, 0.20998382568359375, 0.2303924560546875, 0.25080108642578125, 0.271209716796875, 0.29161834716796875, 0.3120269775390625, 0.33243560791015625, 0.35284423828125, 0.37325286865234375, 0.3936614990234375, 0.41407012939453125, 0.434478759765625, 0.45488739013671875, 0.4752960205078125, 0.49570465087890625, 0.51611328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 13.0, 23.0, 13.0, 20.0, 24.0, 16.0, 18.0, 26.0, 39.0, 65.0, 102.0, 68.0, 90.0, 94.0, 84.0, 60.0, 40.0, 53.0, 27.0, 16.0, 18.0, 16.0, 9.0, 7.0, 3.0, 6.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.583597183227539e-05, -4.437938332557678e-05, -4.2922794818878174e-05, -4.1466206312179565e-05, -4.000961780548096e-05, -3.855302929878235e-05, -3.709644079208374e-05, -3.563985228538513e-05, -3.4183263778686523e-05, -3.2726675271987915e-05, -3.127008676528931e-05, -2.9813498258590698e-05, -2.835690975189209e-05, -2.690032124519348e-05, -2.5443732738494873e-05, -2.3987144231796265e-05, -2.2530555725097656e-05, -2.1073967218399048e-05, -1.961737871170044e-05, -1.816079020500183e-05, -1.6704201698303223e-05, -1.5247613191604614e-05, -1.3791024684906006e-05, -1.2334436178207397e-05, -1.0877847671508789e-05, -9.42125916481018e-06, -7.964670658111572e-06, -6.508082151412964e-06, -5.0514936447143555e-06, -3.594905138015747e-06, -2.1383166313171387e-06, -6.817281246185303e-07, 7.748603820800781e-07, 2.2314488887786865e-06, 3.688037395477295e-06, 5.144625902175903e-06, 6.601214408874512e-06, 8.05780291557312e-06, 9.514391422271729e-06, 1.0970979928970337e-05, 1.2427568435668945e-05, 1.3884156942367554e-05, 1.5340745449066162e-05, 1.679733395576477e-05, 1.825392246246338e-05, 1.9710510969161987e-05, 2.1167099475860596e-05, 2.2623687982559204e-05, 2.4080276489257812e-05, 2.553686499595642e-05, 2.699345350265503e-05, 2.8450042009353638e-05, 2.9906630516052246e-05, 3.1363219022750854e-05, 3.281980752944946e-05, 3.427639603614807e-05, 3.573298454284668e-05, 3.718957304954529e-05, 3.8646161556243896e-05, 4.0102750062942505e-05, 4.155933856964111e-05, 4.301592707633972e-05, 4.447251558303833e-05, 4.592910408973694e-05, 4.738569259643555e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 6.0, 13.0, 33.0, 56.0, 172.0, 514.0, 2456.0, 59857.0, 965500.0, 17770.0, 1538.0, 388.0, 111.0, 47.0, 26.0, 13.0, 16.0, 4.0, 4.0, 4.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5288200378417969, -0.5166244506835938, -0.5044288635253906, -0.4922332763671875, -0.4800376892089844, -0.46784210205078125, -0.4556465148925781, -0.443450927734375, -0.4312553405761719, -0.41905975341796875, -0.4068641662597656, -0.3946685791015625, -0.3824729919433594, -0.37027740478515625, -0.3580818176269531, -0.34588623046875, -0.3336906433105469, -0.32149505615234375, -0.3092994689941406, -0.2971038818359375, -0.2849082946777344, -0.27271270751953125, -0.2605171203613281, -0.248321533203125, -0.23612594604492188, -0.22393035888671875, -0.21173477172851562, -0.1995391845703125, -0.18734359741210938, -0.17514801025390625, -0.16295242309570312, -0.1507568359375, -0.13856124877929688, -0.12636566162109375, -0.11417007446289062, -0.1019744873046875, -0.08977890014648438, -0.07758331298828125, -0.06538772583007812, -0.053192138671875, -0.040996551513671875, -0.02880096435546875, -0.016605377197265625, -0.0044097900390625, 0.007785797119140625, 0.01998138427734375, 0.032176971435546875, 0.04437255859375, 0.056568145751953125, 0.06876373291015625, 0.08095932006835938, 0.0931549072265625, 0.10535049438476562, 0.11754608154296875, 0.12974166870117188, 0.141937255859375, 0.15413284301757812, 0.16632843017578125, 0.17852401733398438, 0.1907196044921875, 0.20291519165039062, 0.21511077880859375, 0.22730636596679688, 0.239501953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 3.0, 6.0, 5.0, 13.0, 28.0, 40.0, 73.0, 99.0, 112.0, 137.0, 136.0, 108.0, 99.0, 53.0, 33.0, 18.0, 12.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2695655822753906, -0.26203155517578125, -0.2544975280761719, -0.2469635009765625, -0.23942947387695312, -0.23189544677734375, -0.22436141967773438, -0.216827392578125, -0.20929336547851562, -0.20175933837890625, -0.19422531127929688, -0.1866912841796875, -0.17915725708007812, -0.17162322998046875, -0.16408920288085938, -0.15655517578125, -0.14902114868164062, -0.14148712158203125, -0.13395309448242188, -0.1264190673828125, -0.11888504028320312, -0.11135101318359375, -0.10381698608398438, -0.096282958984375, -0.08874893188476562, -0.08121490478515625, -0.07368087768554688, -0.0661468505859375, -0.058612823486328125, -0.05107879638671875, -0.043544769287109375, -0.0360107421875, -0.028476715087890625, -0.02094268798828125, -0.013408660888671875, -0.0058746337890625, 0.001659393310546875, 0.00919342041015625, 0.016727447509765625, 0.024261474609375, 0.031795501708984375, 0.03932952880859375, 0.046863555908203125, 0.0543975830078125, 0.061931610107421875, 0.06946563720703125, 0.07699966430664062, 0.08453369140625, 0.09206771850585938, 0.09960174560546875, 0.10713577270507812, 0.1146697998046875, 0.12220382690429688, 0.12973785400390625, 0.13727188110351562, 0.144805908203125, 0.15233993530273438, 0.15987396240234375, 0.16740798950195312, 0.1749420166015625, 0.18247604370117188, 0.19001007080078125, 0.19754409790039062, 0.205078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 21.0, 58.0, 216.0, 343.0, 243.0, 86.0, 18.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.959199905395508, -5.786752223968506, -5.614304542541504, -5.441856861114502, -5.2694091796875, -5.096961498260498, -4.924513816833496, -4.752066135406494, -4.579618453979492, -4.40717077255249, -4.234723091125488, -4.062275409698486, -3.8898277282714844, -3.7173800468444824, -3.5449323654174805, -3.3724846839904785, -3.2000370025634766, -3.0275893211364746, -2.8551416397094727, -2.6826939582824707, -2.5102462768554688, -2.337798595428467, -2.165350914001465, -1.992903232574463, -1.820455551147461, -1.648007869720459, -1.475560188293457, -1.303112506866455, -1.1306648254394531, -0.9582171440124512, -0.7857694625854492, -0.6133217811584473, -0.4408740997314453, -0.26842641830444336, -0.0959787368774414, 0.07646894454956055, 0.2489166259765625, 0.42136430740356445, 0.5938119888305664, 0.7662596702575684, 0.9387073516845703, 1.1111550331115723, 1.2836027145385742, 1.4560503959655762, 1.6284980773925781, 1.80094575881958, 1.973393440246582, 2.145841121673584, 2.318288803100586, 2.490736484527588, 2.66318416595459, 2.835631847381592, 3.0080795288085938, 3.1805272102355957, 3.3529748916625977, 3.5254225730895996, 3.6978702545166016, 3.8703179359436035, 4.0427656173706055, 4.215213298797607, 4.387660980224609, 4.560108661651611, 4.732556343078613, 4.905004024505615, 5.077451705932617]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 10.0, 15.0, 16.0, 18.0, 26.0, 30.0, 32.0, 41.0, 50.0, 47.0, 52.0, 60.0, 55.0, 83.0, 64.0, 60.0, 43.0, 50.0, 43.0, 38.0, 27.0, 31.0, 25.0, 18.0, 14.0, 8.0, 8.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4693262577056885, -3.373845100402832, -3.2783639430999756, -3.182882785797119, -3.087401866912842, -2.9919207096099854, -2.896439552307129, -2.8009583950042725, -2.705477237701416, -2.6099960803985596, -2.514514923095703, -2.4190337657928467, -2.3235526084899902, -2.228071689605713, -2.1325905323028564, -2.037109375, -1.9416282176971436, -1.846147060394287, -1.7506659030914307, -1.6551848649978638, -1.5597037076950073, -1.4642225503921509, -1.368741512298584, -1.2732603549957275, -1.177779197692871, -1.0822980403900146, -0.986816942691803, -0.8913358449935913, -0.7958546876907349, -0.7003735303878784, -0.6048924326896667, -0.5094113349914551, -0.41392993927001953, -0.3184488117694855, -0.22296768426895142, -0.12748655676841736, -0.0320054292678833, 0.06347569823265076, 0.15895682573318481, 0.2544379234313965, 0.34991908073425293, 0.445400208234787, 0.540881335735321, 0.6363624334335327, 0.7318435907363892, 0.8273247480392456, 0.9228058457374573, 1.018286943435669, 1.1137681007385254, 1.2092492580413818, 1.3047304153442383, 1.4002114534378052, 1.4956926107406616, 1.591173768043518, 1.686654806137085, 1.7821359634399414, 1.8776171207427979, 1.9730982780456543, 2.0685794353485107, 2.164060592651367, 2.2595415115356445, 2.355022668838501, 2.4505038261413574, 2.545984983444214, 2.6414661407470703]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 13.0, 4.0, 12.0, 18.0, 51.0, 85.0, 166.0, 364.0, 820.0, 2197.0, 8513.0, 73408.0, 3996158.0, 98321.0, 10029.0, 2495.0, 898.0, 381.0, 182.0, 81.0, 45.0, 16.0, 12.0, 4.0, 2.0, 2.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5611991882324219, -0.5476913452148438, -0.5341835021972656, -0.5206756591796875, -0.5071678161621094, -0.49365997314453125, -0.4801521301269531, -0.466644287109375, -0.4531364440917969, -0.43962860107421875, -0.4261207580566406, -0.4126129150390625, -0.3991050720214844, -0.38559722900390625, -0.3720893859863281, -0.35858154296875, -0.3450736999511719, -0.33156585693359375, -0.3180580139160156, -0.3045501708984375, -0.2910423278808594, -0.27753448486328125, -0.2640266418457031, -0.250518798828125, -0.23701095581054688, -0.22350311279296875, -0.20999526977539062, -0.1964874267578125, -0.18297958374023438, -0.16947174072265625, -0.15596389770507812, -0.1424560546875, -0.12894821166992188, -0.11544036865234375, -0.10193252563476562, -0.0884246826171875, -0.07491683959960938, -0.06140899658203125, -0.047901153564453125, -0.034393310546875, -0.020885467529296875, -0.00737762451171875, 0.006130218505859375, 0.0196380615234375, 0.033145904541015625, 0.04665374755859375, 0.060161590576171875, 0.07366943359375, 0.08717727661132812, 0.10068511962890625, 0.11419296264648438, 0.1277008056640625, 0.14120864868164062, 0.15471649169921875, 0.16822433471679688, 0.181732177734375, 0.19524002075195312, 0.20874786376953125, 0.22225570678710938, 0.2357635498046875, 0.24927139282226562, 0.26277923583984375, 0.2762870788574219, 0.289794921875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 9.0, 15.0, 19.0, 29.0, 37.0, 56.0, 59.0, 81.0, 78.0, 84.0, 84.0, 76.0, 68.0, 53.0, 60.0, 46.0, 42.0, 21.0, 19.0, 15.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17284584045410156, -0.16649246215820312, -0.1601390838623047, -0.15378570556640625, -0.1474323272705078, -0.14107894897460938, -0.13472557067871094, -0.1283721923828125, -0.12201881408691406, -0.11566543579101562, -0.10931205749511719, -0.10295867919921875, -0.09660530090332031, -0.09025192260742188, -0.08389854431152344, -0.077545166015625, -0.07119178771972656, -0.06483840942382812, -0.05848503112792969, -0.05213165283203125, -0.04577827453613281, -0.039424896240234375, -0.03307151794433594, -0.0267181396484375, -0.020364761352539062, -0.014011383056640625, -0.0076580047607421875, -0.00130462646484375, 0.0050487518310546875, 0.011402130126953125, 0.017755508422851562, 0.02410888671875, 0.030462265014648438, 0.036815643310546875, 0.04316902160644531, 0.04952239990234375, 0.05587577819824219, 0.062229156494140625, 0.06858253479003906, 0.0749359130859375, 0.08128929138183594, 0.08764266967773438, 0.09399604797363281, 0.10034942626953125, 0.10670280456542969, 0.11305618286132812, 0.11940956115722656, 0.125762939453125, 0.13211631774902344, 0.13846969604492188, 0.1448230743408203, 0.15117645263671875, 0.1575298309326172, 0.16388320922851562, 0.17023658752441406, 0.1765899658203125, 0.18294334411621094, 0.18929672241210938, 0.1956501007080078, 0.20200347900390625, 0.2083568572998047, 0.21471023559570312, 0.22106361389160156, 0.2274169921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 4.0, 5.0, 11.0, 15.0, 16.0, 27.0, 31.0, 28.0, 48.0, 71.0, 93.0, 146.0, 248.0, 390.0, 652.0, 1169.0, 2192.0, 4137.0, 8773.0, 22279.0, 78036.0, 680359.0, 3203491.0, 135978.0, 32822.0, 11866.0, 5235.0, 2620.0, 1419.0, 777.0, 442.0, 286.0, 167.0, 129.0, 73.0, 56.0, 50.0, 36.0, 27.0, 23.0, 16.0, 13.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14990234375, -0.14493370056152344, -0.13996505737304688, -0.1349964141845703, -0.13002777099609375, -0.1250591278076172, -0.12009048461914062, -0.11512184143066406, -0.1101531982421875, -0.10518455505371094, -0.10021591186523438, -0.09524726867675781, -0.09027862548828125, -0.08530998229980469, -0.08034133911132812, -0.07537269592285156, -0.070404052734375, -0.06543540954589844, -0.060466766357421875, -0.05549812316894531, -0.05052947998046875, -0.04556083679199219, -0.040592193603515625, -0.03562355041503906, -0.0306549072265625, -0.025686264038085938, -0.020717620849609375, -0.015748977661132812, -0.01078033447265625, -0.0058116912841796875, -0.000843048095703125, 0.0041255950927734375, 0.00909423828125, 0.014062881469726562, 0.019031524658203125, 0.024000167846679688, 0.02896881103515625, 0.03393745422363281, 0.038906097412109375, 0.04387474060058594, 0.0488433837890625, 0.05381202697753906, 0.058780670166015625, 0.06374931335449219, 0.06871795654296875, 0.07368659973144531, 0.07865524291992188, 0.08362388610839844, 0.088592529296875, 0.09356117248535156, 0.09852981567382812, 0.10349845886230469, 0.10846710205078125, 0.11343574523925781, 0.11840438842773438, 0.12337303161621094, 0.1283416748046875, 0.13331031799316406, 0.13827896118164062, 0.1432476043701172, 0.14821624755859375, 0.1531848907470703, 0.15815353393554688, 0.16312217712402344, 0.1680908203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 9.0, 24.0, 32.0, 55.0, 116.0, 322.0, 2361.0, 745.0, 186.0, 87.0, 47.0, 26.0, 15.0, 10.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08263015747070312, -0.07822418212890625, -0.07381820678710938, -0.0694122314453125, -0.06500625610351562, -0.06060028076171875, -0.056194305419921875, -0.051788330078125, -0.047382354736328125, -0.04297637939453125, -0.038570404052734375, -0.0341644287109375, -0.029758453369140625, -0.02535247802734375, -0.020946502685546875, -0.01654052734375, -0.012134552001953125, -0.00772857666015625, -0.003322601318359375, 0.0010833740234375, 0.005489349365234375, 0.00989532470703125, 0.014301300048828125, 0.018707275390625, 0.023113250732421875, 0.02751922607421875, 0.031925201416015625, 0.0363311767578125, 0.040737152099609375, 0.04514312744140625, 0.049549102783203125, 0.053955078125, 0.058361053466796875, 0.06276702880859375, 0.06717300415039062, 0.0715789794921875, 0.07598495483398438, 0.08039093017578125, 0.08479690551757812, 0.089202880859375, 0.09360885620117188, 0.09801483154296875, 0.10242080688476562, 0.1068267822265625, 0.11123275756835938, 0.11563873291015625, 0.12004470825195312, 0.12445068359375, 0.12885665893554688, 0.13326263427734375, 0.13766860961914062, 0.1420745849609375, 0.14648056030273438, 0.15088653564453125, 0.15529251098632812, 0.159698486328125, 0.16410446166992188, 0.16851043701171875, 0.17291641235351562, 0.1773223876953125, 0.18172836303710938, 0.18613433837890625, 0.19054031372070312, 0.1949462890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 18.0, 34.0, 75.0, 116.0, 200.0, 188.0, 171.0, 103.0, 56.0, 12.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9666217565536499, -0.9421549439430237, -0.9176881909370422, -0.893221378326416, -0.8687546253204346, -0.8442878127098083, -0.8198210000991821, -0.7953542470932007, -0.7708874344825745, -0.7464206218719482, -0.7219538688659668, -0.6974870562553406, -0.6730203032493591, -0.6485534906387329, -0.6240867376327515, -0.5996199250221252, -0.575153112411499, -0.5506862998008728, -0.5262195467948914, -0.5017527341842651, -0.4772859513759613, -0.45281916856765747, -0.42835238575935364, -0.4038856029510498, -0.37941884994506836, -0.3549520671367645, -0.3304852843284607, -0.3060184717178345, -0.28155168890953064, -0.2570849061012268, -0.23261812329292297, -0.20815132558345795, -0.18368452787399292, -0.1592177450656891, -0.13475094735622406, -0.11028416454792023, -0.0858173742890358, -0.06135058403015137, -0.036883801221847534, -0.012417003512382507, 0.012049779295921326, 0.036516569554805756, 0.06098335608839989, 0.08545014262199402, 0.10991693288087845, 0.13438372313976288, 0.1588505059480667, 0.18331730365753174, 0.20778408646583557, 0.2322508692741394, 0.25671765208244324, 0.28118443489074707, 0.3056512475013733, 0.3301180303096771, 0.35458481311798096, 0.3790516257286072, 0.4035183787345886, 0.42798516154289246, 0.4524519443511963, 0.4769187569618225, 0.501385509967804, 0.5258523225784302, 0.5503190755844116, 0.5747858881950378, 0.5992527008056641]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 13.0, 21.0, 15.0, 29.0, 24.0, 24.0, 28.0, 22.0, 23.0, 35.0, 55.0, 41.0, 40.0, 55.0, 64.0, 34.0, 54.0, 47.0, 55.0, 42.0, 42.0, 35.0, 30.0, 32.0, 21.0, 24.0, 15.0, 13.0, 9.0, 12.0, 5.0, 4.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.29025834798812866, -0.28041642904281616, -0.27057451009750366, -0.26073259115219116, -0.25089070200920105, -0.24104878306388855, -0.23120686411857605, -0.22136494517326355, -0.21152302622795105, -0.20168110728263855, -0.19183920323848724, -0.18199728429317474, -0.17215536534786224, -0.16231346130371094, -0.15247154235839844, -0.14262962341308594, -0.13278771936893463, -0.12294580787420273, -0.11310388892889023, -0.10326197743415833, -0.09342005848884583, -0.08357814699411392, -0.07373623549938202, -0.06389431655406952, -0.054052405059337616, -0.044210489839315414, -0.03436857461929321, -0.02452666312456131, -0.014684747904539108, -0.004842832684516907, 0.004999078810214996, 0.014840997755527496, 0.0246829092502594, 0.0345248244702816, 0.0443667396903038, 0.054208651185035706, 0.0640505701303482, 0.07389248162508011, 0.08373439311981201, 0.09357631206512451, 0.10341822355985641, 0.11326013505458832, 0.12310205399990082, 0.13294395804405212, 0.14278587698936462, 0.15262779593467712, 0.16246971487998962, 0.17231163382530212, 0.18215353786945343, 0.19199545681476593, 0.20183736085891724, 0.21167927980422974, 0.22152119874954224, 0.23136311769485474, 0.24120502173900604, 0.25104695558547974, 0.26088884472846985, 0.27073076367378235, 0.28057268261909485, 0.29041457176208496, 0.30025649070739746, 0.31009840965270996, 0.31994032859802246, 0.32978224754333496, 0.33962416648864746]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 0.0, 3.0, 8.0, 11.0, 22.0, 24.0, 51.0, 95.0, 192.0, 567.0, 2326.0, 20232.0, 485038.0, 515061.0, 21550.0, 2376.0, 581.0, 187.0, 104.0, 41.0, 30.0, 16.0, 16.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.75048828125, -0.7312507629394531, -0.7120132446289062, -0.6927757263183594, -0.6735382080078125, -0.6543006896972656, -0.6350631713867188, -0.6158256530761719, -0.596588134765625, -0.5773506164550781, -0.5581130981445312, -0.5388755798339844, -0.5196380615234375, -0.5004005432128906, -0.48116302490234375, -0.4619255065917969, -0.44268798828125, -0.4234504699707031, -0.40421295166015625, -0.3849754333496094, -0.3657379150390625, -0.3465003967285156, -0.32726287841796875, -0.3080253601074219, -0.288787841796875, -0.2695503234863281, -0.25031280517578125, -0.23107528686523438, -0.2118377685546875, -0.19260025024414062, -0.17336273193359375, -0.15412521362304688, -0.1348876953125, -0.11565017700195312, -0.09641265869140625, -0.07717514038085938, -0.0579376220703125, -0.038700103759765625, -0.01946258544921875, -0.000225067138671875, 0.019012451171875, 0.038249969482421875, 0.05748748779296875, 0.07672500610351562, 0.0959625244140625, 0.11520004272460938, 0.13443756103515625, 0.15367507934570312, 0.17291259765625, 0.19215011596679688, 0.21138763427734375, 0.23062515258789062, 0.2498626708984375, 0.2691001892089844, 0.28833770751953125, 0.3075752258300781, 0.326812744140625, 0.3460502624511719, 0.36528778076171875, 0.3845252990722656, 0.4037628173828125, 0.4230003356933594, 0.44223785400390625, 0.4614753723144531, 0.480712890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 14.0, 14.0, 19.0, 25.0, 54.0, 47.0, 52.0, 80.0, 86.0, 60.0, 84.0, 73.0, 80.0, 71.0, 50.0, 45.0, 50.0, 22.0, 18.0, 17.0, 8.0, 10.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.17122268676757812, -0.16495513916015625, -0.15868759155273438, -0.1524200439453125, -0.14615249633789062, -0.13988494873046875, -0.13361740112304688, -0.127349853515625, -0.12108230590820312, -0.11481475830078125, -0.10854721069335938, -0.1022796630859375, -0.09601211547851562, -0.08974456787109375, -0.08347702026367188, -0.07720947265625, -0.07094192504882812, -0.06467437744140625, -0.058406829833984375, -0.0521392822265625, -0.045871734619140625, -0.03960418701171875, -0.033336639404296875, -0.027069091796875, -0.020801544189453125, -0.01453399658203125, -0.008266448974609375, -0.0019989013671875, 0.004268646240234375, 0.01053619384765625, 0.016803741455078125, 0.0230712890625, 0.029338836669921875, 0.03560638427734375, 0.041873931884765625, 0.0481414794921875, 0.054409027099609375, 0.06067657470703125, 0.06694412231445312, 0.073211669921875, 0.07947921752929688, 0.08574676513671875, 0.09201431274414062, 0.0982818603515625, 0.10454940795898438, 0.11081695556640625, 0.11708450317382812, 0.12335205078125, 0.12961959838867188, 0.13588714599609375, 0.14215469360351562, 0.1484222412109375, 0.15468978881835938, 0.16095733642578125, 0.16722488403320312, 0.173492431640625, 0.17975997924804688, 0.18602752685546875, 0.19229507446289062, 0.1985626220703125, 0.20483016967773438, 0.21109771728515625, 0.21736526489257812, 0.2236328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 10.0, 8.0, 11.0, 19.0, 27.0, 32.0, 64.0, 89.0, 164.0, 281.0, 592.0, 1651.0, 7942.0, 163100.0, 834160.0, 34853.0, 3478.0, 1004.0, 425.0, 273.0, 123.0, 84.0, 42.0, 28.0, 23.0, 20.0, 14.0, 5.0, 7.0, 8.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.61328125, -0.5948562622070312, -0.5764312744140625, -0.5580062866210938, -0.539581298828125, -0.5211563110351562, -0.5027313232421875, -0.48430633544921875, -0.46588134765625, -0.44745635986328125, -0.4290313720703125, -0.41060638427734375, -0.392181396484375, -0.37375640869140625, -0.3553314208984375, -0.33690643310546875, -0.3184814453125, -0.30005645751953125, -0.2816314697265625, -0.26320648193359375, -0.244781494140625, -0.22635650634765625, -0.2079315185546875, -0.18950653076171875, -0.17108154296875, -0.15265655517578125, -0.1342315673828125, -0.11580657958984375, -0.097381591796875, -0.07895660400390625, -0.0605316162109375, -0.04210662841796875, -0.023681640625, -0.00525665283203125, 0.0131683349609375, 0.03159332275390625, 0.050018310546875, 0.06844329833984375, 0.0868682861328125, 0.10529327392578125, 0.12371826171875, 0.14214324951171875, 0.1605682373046875, 0.17899322509765625, 0.197418212890625, 0.21584320068359375, 0.2342681884765625, 0.25269317626953125, 0.2711181640625, 0.28954315185546875, 0.3079681396484375, 0.32639312744140625, 0.344818115234375, 0.36324310302734375, 0.3816680908203125, 0.40009307861328125, 0.41851806640625, 0.43694305419921875, 0.4553680419921875, 0.47379302978515625, 0.492218017578125, 0.5106430053710938, 0.5290679931640625, 0.5474929809570312, 0.56591796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 6.0, 6.0, 5.0, 11.0, 8.0, 15.0, 16.0, 24.0, 24.0, 17.0, 26.0, 23.0, 29.0, 55.0, 21.0, 53.0, 38.0, 30.0, 59.0, 43.0, 43.0, 44.0, 39.0, 48.0, 34.0, 41.0, 37.0, 24.0, 34.0, 25.0, 23.0, 13.0, 9.0, 13.0, 12.0, 1.0, 11.0, 6.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.42138671875, -0.4075660705566406, -0.39374542236328125, -0.3799247741699219, -0.3661041259765625, -0.3522834777832031, -0.33846282958984375, -0.3246421813964844, -0.310821533203125, -0.2970008850097656, -0.28318023681640625, -0.2693595886230469, -0.2555389404296875, -0.24171829223632812, -0.22789764404296875, -0.21407699584960938, -0.20025634765625, -0.18643569946289062, -0.17261505126953125, -0.15879440307617188, -0.1449737548828125, -0.13115310668945312, -0.11733245849609375, -0.10351181030273438, -0.089691162109375, -0.07587051391601562, -0.06204986572265625, -0.048229217529296875, -0.0344085693359375, -0.020587921142578125, -0.00676727294921875, 0.007053375244140625, 0.0208740234375, 0.034694671630859375, 0.04851531982421875, 0.062335968017578125, 0.0761566162109375, 0.08997726440429688, 0.10379791259765625, 0.11761856079101562, 0.131439208984375, 0.14525985717773438, 0.15908050537109375, 0.17290115356445312, 0.1867218017578125, 0.20054244995117188, 0.21436309814453125, 0.22818374633789062, 0.24200439453125, 0.2558250427246094, 0.26964569091796875, 0.2834663391113281, 0.2972869873046875, 0.3111076354980469, 0.32492828369140625, 0.3387489318847656, 0.352569580078125, 0.3663902282714844, 0.38021087646484375, 0.3940315246582031, 0.4078521728515625, 0.4216728210449219, 0.43549346923828125, 0.4493141174316406, 0.463134765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 8.0, 4.0, 5.0, 14.0, 27.0, 43.0, 63.0, 112.0, 234.0, 604.0, 1429.0, 5354.0, 36944.0, 678273.0, 300611.0, 19233.0, 3604.0, 1085.0, 453.0, 195.0, 101.0, 54.0, 39.0, 24.0, 10.0, 5.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1475830078125, -0.1420879364013672, -0.13659286499023438, -0.13109779357910156, -0.12560272216796875, -0.12010765075683594, -0.11461257934570312, -0.10911750793457031, -0.1036224365234375, -0.09812736511230469, -0.09263229370117188, -0.08713722229003906, -0.08164215087890625, -0.07614707946777344, -0.07065200805664062, -0.06515693664550781, -0.059661865234375, -0.05416679382324219, -0.048671722412109375, -0.04317665100097656, -0.03768157958984375, -0.03218650817871094, -0.026691436767578125, -0.021196365356445312, -0.0157012939453125, -0.010206222534179688, -0.004711151123046875, 0.0007839202880859375, 0.00627899169921875, 0.011774063110351562, 0.017269134521484375, 0.022764205932617188, 0.02825927734375, 0.03375434875488281, 0.039249420166015625, 0.04474449157714844, 0.05023956298828125, 0.05573463439941406, 0.061229705810546875, 0.06672477722167969, 0.0722198486328125, 0.07771492004394531, 0.08320999145507812, 0.08870506286621094, 0.09420013427734375, 0.09969520568847656, 0.10519027709960938, 0.11068534851074219, 0.116180419921875, 0.12167549133300781, 0.12717056274414062, 0.13266563415527344, 0.13816070556640625, 0.14365577697753906, 0.14915084838867188, 0.1546459197998047, 0.1601409912109375, 0.1656360626220703, 0.17113113403320312, 0.17662620544433594, 0.18212127685546875, 0.18761634826660156, 0.19311141967773438, 0.1986064910888672, 0.2041015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 4.0, 7.0, 6.0, 8.0, 6.0, 12.0, 6.0, 10.0, 12.0, 18.0, 15.0, 23.0, 22.0, 20.0, 39.0, 35.0, 46.0, 52.0, 73.0, 109.0, 100.0, 75.0, 46.0, 44.0, 34.0, 21.0, 27.0, 19.0, 16.0, 17.0, 14.0, 7.0, 9.0, 10.0, 8.0, 4.0, 4.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.561113357543945e-05, -5.4006464779376984e-05, -5.2401795983314514e-05, -5.0797127187252045e-05, -4.9192458391189575e-05, -4.7587789595127106e-05, -4.5983120799064636e-05, -4.437845200300217e-05, -4.27737832069397e-05, -4.116911441087723e-05, -3.956444561481476e-05, -3.795977681875229e-05, -3.635510802268982e-05, -3.475043922662735e-05, -3.314577043056488e-05, -3.154110163450241e-05, -2.993643283843994e-05, -2.8331764042377472e-05, -2.6727095246315002e-05, -2.5122426450252533e-05, -2.3517757654190063e-05, -2.1913088858127594e-05, -2.0308420062065125e-05, -1.8703751266002655e-05, -1.7099082469940186e-05, -1.5494413673877716e-05, -1.3889744877815247e-05, -1.2285076081752777e-05, -1.0680407285690308e-05, -9.075738489627838e-06, -7.471069693565369e-06, -5.866400897502899e-06, -4.26173210144043e-06, -2.65706330537796e-06, -1.0523945093154907e-06, 5.522742867469788e-07, 2.1569430828094482e-06, 3.7616118788719177e-06, 5.366280674934387e-06, 6.970949470996857e-06, 8.575618267059326e-06, 1.0180287063121796e-05, 1.1784955859184265e-05, 1.3389624655246735e-05, 1.4994293451309204e-05, 1.6598962247371674e-05, 1.8203631043434143e-05, 1.9808299839496613e-05, 2.1412968635559082e-05, 2.301763743162155e-05, 2.462230622768402e-05, 2.622697502374649e-05, 2.783164381980896e-05, 2.943631261587143e-05, 3.10409814119339e-05, 3.264565020799637e-05, 3.425031900405884e-05, 3.585498780012131e-05, 3.745965659618378e-05, 3.9064325392246246e-05, 4.0668994188308716e-05, 4.2273662984371185e-05, 4.3878331780433655e-05, 4.5483000576496124e-05, 4.7087669372558594e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 10.0, 21.0, 50.0, 107.0, 249.0, 898.0, 4796.0, 147481.0, 875938.0, 16598.0, 1690.0, 427.0, 176.0, 60.0, 28.0, 11.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26806640625, -0.2585716247558594, -0.24907684326171875, -0.23958206176757812, -0.2300872802734375, -0.22059249877929688, -0.21109771728515625, -0.20160293579101562, -0.192108154296875, -0.18261337280273438, -0.17311859130859375, -0.16362380981445312, -0.1541290283203125, -0.14463424682617188, -0.13513946533203125, -0.12564468383789062, -0.11614990234375, -0.10665512084960938, -0.09716033935546875, -0.08766555786132812, -0.0781707763671875, -0.06867599487304688, -0.05918121337890625, -0.049686431884765625, -0.040191650390625, -0.030696868896484375, -0.02120208740234375, -0.011707305908203125, -0.0022125244140625, 0.007282257080078125, 0.01677703857421875, 0.026271820068359375, 0.0357666015625, 0.045261383056640625, 0.05475616455078125, 0.06425094604492188, 0.0737457275390625, 0.08324050903320312, 0.09273529052734375, 0.10223007202148438, 0.111724853515625, 0.12121963500976562, 0.13071441650390625, 0.14020919799804688, 0.1497039794921875, 0.15919876098632812, 0.16869354248046875, 0.17818832397460938, 0.18768310546875, 0.19717788696289062, 0.20667266845703125, 0.21616744995117188, 0.2256622314453125, 0.23515701293945312, 0.24465179443359375, 0.2541465759277344, 0.263641357421875, 0.2731361389160156, 0.28263092041015625, 0.2921257019042969, 0.3016204833984375, 0.3111152648925781, 0.32061004638671875, 0.3301048278808594, 0.339599609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 10.0, 10.0, 7.0, 10.0, 18.0, 33.0, 31.0, 59.0, 69.0, 112.0, 122.0, 124.0, 108.0, 82.0, 68.0, 49.0, 28.0, 23.0, 13.0, 13.0, 4.0, 5.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17526817321777344, -0.16999435424804688, -0.1647205352783203, -0.15944671630859375, -0.1541728973388672, -0.14889907836914062, -0.14362525939941406, -0.1383514404296875, -0.13307762145996094, -0.12780380249023438, -0.12252998352050781, -0.11725616455078125, -0.11198234558105469, -0.10670852661132812, -0.10143470764160156, -0.096160888671875, -0.09088706970214844, -0.08561325073242188, -0.08033943176269531, -0.07506561279296875, -0.06979179382324219, -0.06451797485351562, -0.05924415588378906, -0.0539703369140625, -0.04869651794433594, -0.043422698974609375, -0.03814888000488281, -0.03287506103515625, -0.027601242065429688, -0.022327423095703125, -0.017053604125976562, -0.01177978515625, -0.0065059661865234375, -0.001232147216796875, 0.0040416717529296875, 0.00931549072265625, 0.014589309692382812, 0.019863128662109375, 0.025136947631835938, 0.0304107666015625, 0.03568458557128906, 0.040958404541015625, 0.04623222351074219, 0.05150604248046875, 0.05677986145019531, 0.062053680419921875, 0.06732749938964844, 0.072601318359375, 0.07787513732910156, 0.08314895629882812, 0.08842277526855469, 0.09369659423828125, 0.09897041320800781, 0.10424423217773438, 0.10951805114746094, 0.1147918701171875, 0.12006568908691406, 0.12533950805664062, 0.1306133270263672, 0.13588714599609375, 0.1411609649658203, 0.14643478393554688, 0.15170860290527344, 0.156982421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 17.0, 80.0, 291.0, 411.0, 176.0, 23.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.352109670639038, -1.1346243619918823, -0.9171390533447266, -0.699653685092926, -0.48216837644577026, -0.2646830081939697, -0.047197699546813965, 0.1702876091003418, 0.38777291774749756, 0.6052582263946533, 0.8227435350418091, 1.0402288436889648, 1.2577142715454102, 1.475199580192566, 1.6926848888397217, 1.9101701974868774, 2.127655506134033, 2.3451409339904785, 2.5626261234283447, 2.78011155128479, 2.9975967407226562, 3.2150821685791016, 3.432567596435547, 3.650052785873413, 3.8675379753112793, 4.085023403167725, 4.30250883102417, 4.519993782043457, 4.737479209899902, 4.954964637756348, 5.172450065612793, 5.389935493469238, 5.607420444488525, 5.824905872344971, 6.042391300201416, 6.259876251220703, 6.477361679077148, 6.694847106933594, 6.912332534790039, 7.129817962646484, 7.3473029136657715, 7.564788341522217, 7.782273769378662, 7.999758720397949, 8.217244148254395, 8.43472957611084, 8.652215003967285, 8.86970043182373, 9.087185859680176, 9.304671287536621, 9.522156715393066, 9.739642143249512, 9.957127571105957, 10.174612045288086, 10.392097473144531, 10.609582901000977, 10.827068328857422, 11.044553756713867, 11.262039184570312, 11.479524612426758, 11.697010040283203, 11.914495468139648, 12.131979942321777, 12.349465370178223, 12.566950798034668]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 9.0, 10.0, 12.0, 21.0, 14.0, 17.0, 29.0, 31.0, 34.0, 27.0, 42.0, 37.0, 44.0, 69.0, 62.0, 67.0, 53.0, 49.0, 56.0, 34.0, 38.0, 34.0, 44.0, 35.0, 23.0, 23.0, 15.0, 18.0, 11.0, 8.0, 11.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0299534797668457, -1.9568727016448975, -1.8837920427322388, -1.8107112646102905, -1.7376306056976318, -1.6645498275756836, -1.5914690494537354, -1.5183883905410767, -1.445307731628418, -1.3722269535064697, -1.299146294593811, -1.2260655164718628, -1.152984857559204, -1.0799040794372559, -1.0068233013153076, -0.9337426424026489, -0.8606618642807007, -0.7875811457633972, -0.7145004272460938, -0.6414196491241455, -0.5683389902114868, -0.49525824189186096, -0.4221774935722351, -0.34909677505493164, -0.2760160565376282, -0.2029353380203247, -0.12985460460186005, -0.056773871183395386, 0.01630684733390808, 0.08938756585121155, 0.1624683141708374, 0.23554903268814087, 0.30862975120544434, 0.3817104697227478, 0.45479118824005127, 0.5278719663619995, 0.6009526252746582, 0.6740334033966064, 0.7471141219139099, 0.8201948404312134, 0.8932755589485168, 0.9663562774658203, 1.0394370555877686, 1.1125177145004272, 1.1855984926223755, 1.2586791515350342, 1.3317599296569824, 1.4048407077789307, 1.4779213666915894, 1.5510021448135376, 1.6240828037261963, 1.6971635818481445, 1.7702442407608032, 1.8433250188827515, 1.9164056777954102, 1.9894864559173584, 2.0625672340393066, 2.135648012161255, 2.208728790283203, 2.2818093299865723, 2.3548901081085205, 2.4279708862304688, 2.501051664352417, 2.5741324424743652, 2.6472129821777344]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 10.0, 8.0, 12.0, 11.0, 20.0, 26.0, 39.0, 47.0, 88.0, 162.0, 261.0, 552.0, 1427.0, 4671.0, 29211.0, 1106717.0, 2985625.0, 55079.0, 6950.0, 1902.0, 652.0, 312.0, 174.0, 90.0, 59.0, 41.0, 31.0, 19.0, 18.0, 15.0, 6.0, 13.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.341064453125, -0.3310699462890625, -0.321075439453125, -0.3110809326171875, -0.30108642578125, -0.2910919189453125, -0.281097412109375, -0.2711029052734375, -0.2611083984375, -0.2511138916015625, -0.241119384765625, -0.2311248779296875, -0.22113037109375, -0.2111358642578125, -0.201141357421875, -0.1911468505859375, -0.18115234375, -0.1711578369140625, -0.161163330078125, -0.1511688232421875, -0.14117431640625, -0.1311798095703125, -0.121185302734375, -0.1111907958984375, -0.1011962890625, -0.0912017822265625, -0.081207275390625, -0.0712127685546875, -0.06121826171875, -0.0512237548828125, -0.041229248046875, -0.0312347412109375, -0.021240234375, -0.0112457275390625, -0.001251220703125, 0.0087432861328125, 0.01873779296875, 0.0287322998046875, 0.038726806640625, 0.0487213134765625, 0.0587158203125, 0.0687103271484375, 0.078704833984375, 0.0886993408203125, 0.09869384765625, 0.1086883544921875, 0.118682861328125, 0.1286773681640625, 0.138671875, 0.1486663818359375, 0.158660888671875, 0.1686553955078125, 0.17864990234375, 0.1886444091796875, 0.198638916015625, 0.2086334228515625, 0.2186279296875, 0.2286224365234375, 0.238616943359375, 0.2486114501953125, 0.25860595703125, 0.2686004638671875, 0.278594970703125, 0.2885894775390625, 0.298583984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 15.0, 15.0, 20.0, 37.0, 41.0, 66.0, 95.0, 86.0, 85.0, 85.0, 84.0, 84.0, 62.0, 53.0, 42.0, 40.0, 21.0, 20.0, 8.0, 12.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16370010375976562, -0.15747833251953125, -0.15125656127929688, -0.1450347900390625, -0.13881301879882812, -0.13259124755859375, -0.12636947631835938, -0.120147705078125, -0.11392593383789062, -0.10770416259765625, -0.10148239135742188, -0.0952606201171875, -0.08903884887695312, -0.08281707763671875, -0.07659530639648438, -0.07037353515625, -0.06415176391601562, -0.05792999267578125, -0.051708221435546875, -0.0454864501953125, -0.039264678955078125, -0.03304290771484375, -0.026821136474609375, -0.020599365234375, -0.014377593994140625, -0.00815582275390625, -0.001934051513671875, 0.0042877197265625, 0.010509490966796875, 0.01673126220703125, 0.022953033447265625, 0.0291748046875, 0.035396575927734375, 0.04161834716796875, 0.047840118408203125, 0.0540618896484375, 0.060283660888671875, 0.06650543212890625, 0.07272720336914062, 0.078948974609375, 0.08517074584960938, 0.09139251708984375, 0.09761428833007812, 0.1038360595703125, 0.11005783081054688, 0.11627960205078125, 0.12250137329101562, 0.12872314453125, 0.13494491577148438, 0.14116668701171875, 0.14738845825195312, 0.1536102294921875, 0.15983200073242188, 0.16605377197265625, 0.17227554321289062, 0.178497314453125, 0.18471908569335938, 0.19094085693359375, 0.19716262817382812, 0.2033843994140625, 0.20960617065429688, 0.21582794189453125, 0.22204971313476562, 0.228271484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 9.0, 9.0, 16.0, 42.0, 67.0, 130.0, 335.0, 1123.0, 5400.0, 69653.0, 3988282.0, 120320.0, 6978.0, 1252.0, 351.0, 136.0, 70.0, 30.0, 26.0, 19.0, 7.0, 3.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.408935546875, -0.3941001892089844, -0.37926483154296875, -0.3644294738769531, -0.3495941162109375, -0.3347587585449219, -0.31992340087890625, -0.3050880432128906, -0.290252685546875, -0.2754173278808594, -0.26058197021484375, -0.24574661254882812, -0.2309112548828125, -0.21607589721679688, -0.20124053955078125, -0.18640518188476562, -0.17156982421875, -0.15673446655273438, -0.14189910888671875, -0.12706375122070312, -0.1122283935546875, -0.09739303588867188, -0.08255767822265625, -0.06772232055664062, -0.052886962890625, -0.038051605224609375, -0.02321624755859375, -0.008380889892578125, 0.0064544677734375, 0.021289825439453125, 0.03612518310546875, 0.050960540771484375, 0.0657958984375, 0.08063125610351562, 0.09546661376953125, 0.11030197143554688, 0.1251373291015625, 0.13997268676757812, 0.15480804443359375, 0.16964340209960938, 0.184478759765625, 0.19931411743164062, 0.21414947509765625, 0.22898483276367188, 0.2438201904296875, 0.2586555480957031, 0.27349090576171875, 0.2883262634277344, 0.30316162109375, 0.3179969787597656, 0.33283233642578125, 0.3476676940917969, 0.3625030517578125, 0.3773384094238281, 0.39217376708984375, 0.4070091247558594, 0.421844482421875, 0.4366798400878906, 0.45151519775390625, 0.4663505554199219, 0.4811859130859375, 0.4960212707519531, 0.5108566284179688, 0.5256919860839844, 0.54052734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 9.0, 21.0, 29.0, 50.0, 85.0, 215.0, 530.0, 1074.0, 983.0, 510.0, 237.0, 133.0, 52.0, 39.0, 15.0, 18.0, 14.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.34649658203125, -0.3363037109375, -0.32611083984375, -0.31591796875, -0.30572509765625, -0.2955322265625, -0.28533935546875, -0.275146484375, -0.26495361328125, -0.2547607421875, -0.24456787109375, -0.234375, -0.22418212890625, -0.2139892578125, -0.20379638671875, -0.193603515625, -0.18341064453125, -0.1732177734375, -0.16302490234375, -0.15283203125, -0.14263916015625, -0.1324462890625, -0.12225341796875, -0.112060546875, -0.10186767578125, -0.0916748046875, -0.08148193359375, -0.0712890625, -0.06109619140625, -0.0509033203125, -0.04071044921875, -0.030517578125, -0.02032470703125, -0.0101318359375, 6.103515625e-05, 0.01025390625, 0.02044677734375, 0.0306396484375, 0.04083251953125, 0.051025390625, 0.06121826171875, 0.0714111328125, 0.08160400390625, 0.091796875, 0.10198974609375, 0.1121826171875, 0.12237548828125, 0.132568359375, 0.14276123046875, 0.1529541015625, 0.16314697265625, 0.17333984375, 0.18353271484375, 0.1937255859375, 0.20391845703125, 0.214111328125, 0.22430419921875, 0.2344970703125, 0.24468994140625, 0.2548828125, 0.26507568359375, 0.2752685546875, 0.28546142578125, 0.295654296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 9.0, 53.0, 123.0, 248.0, 275.0, 164.0, 69.0, 21.0, 17.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.164518356323242, -3.0649330615997314, -2.9653477668762207, -2.86576247215271, -2.766177177429199, -2.6665918827056885, -2.5670065879821777, -2.467421293258667, -2.3678359985351562, -2.2682507038116455, -2.1686654090881348, -2.069080114364624, -1.9694948196411133, -1.8699095249176025, -1.7703242301940918, -1.670738935470581, -1.5711535215377808, -1.47156822681427, -1.3719829320907593, -1.2723976373672485, -1.1728123426437378, -1.073227047920227, -0.9736416935920715, -0.8740563988685608, -0.77447110414505, -0.6748858094215393, -0.5753005146980286, -0.47571519017219543, -0.3761298954486847, -0.27654460072517395, -0.17695927619934082, -0.07737398147583008, 0.022211313247680664, 0.121796615421772, 0.22138191759586334, 0.3209672272205353, 0.420552521944046, 0.5201377868652344, 0.6197231411933899, 0.7193084359169006, 0.8188937306404114, 0.9184790253639221, 1.0180643796920776, 1.1176496744155884, 1.2172349691390991, 1.3168202638626099, 1.4164055585861206, 1.5159908533096313, 1.615576148033142, 1.7151614427566528, 1.8147467374801636, 1.9143320322036743, 2.0139174461364746, 2.1135027408599854, 2.213088035583496, 2.312673330307007, 2.4122586250305176, 2.5118439197540283, 2.611429214477539, 2.71101450920105, 2.8105998039245605, 2.9101850986480713, 3.009770393371582, 3.1093556880950928, 3.2089409828186035]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 11.0, 12.0, 21.0, 20.0, 16.0, 34.0, 26.0, 29.0, 35.0, 44.0, 46.0, 39.0, 38.0, 60.0, 44.0, 61.0, 50.0, 44.0, 39.0, 33.0, 46.0, 29.0, 30.0, 33.0, 18.0, 23.0, 11.0, 13.0, 19.0, 13.0, 8.0, 8.0, 6.0, 10.0, 5.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0129623413085938, -0.9760415554046631, -0.9391207098960876, -0.902199923992157, -0.8652790784835815, -0.8283582925796509, -0.7914375066757202, -0.7545167207717896, -0.7175958752632141, -0.6806750893592834, -0.643754243850708, -0.6068334579467773, -0.5699126720428467, -0.5329918265342712, -0.4960710406303406, -0.4591502249240875, -0.4222294092178345, -0.3853085935115814, -0.34838777780532837, -0.3114669919013977, -0.27454617619514465, -0.2376253604888916, -0.20070455968379974, -0.16378375887870789, -0.12686294317245483, -0.08994213491678238, -0.053021326661109924, -0.01610051840543747, 0.020820289850234985, 0.05774110555648804, 0.0946619063615799, 0.13158270716667175, 0.1685035228729248, 0.20542433857917786, 0.24234513938426971, 0.2792659401893616, 0.3161867558956146, 0.3531075716018677, 0.39002835750579834, 0.4269491732120514, 0.46386998891830444, 0.5007907748222351, 0.5377116203308105, 0.5746324062347412, 0.6115531921386719, 0.6484740376472473, 0.685394823551178, 0.7223156690597534, 0.7592364549636841, 0.7961572408676147, 0.8330780863761902, 0.8699988722801208, 0.9069197177886963, 0.943840503692627, 0.9807612895965576, 1.0176820755004883, 1.054602861404419, 1.0915236473083496, 1.1284444332122803, 1.1653653383255005, 1.2022861242294312, 1.2392069101333618, 1.2761276960372925, 1.3130484819412231, 1.3499693870544434]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 9.0, 11.0, 18.0, 19.0, 35.0, 43.0, 47.0, 85.0, 130.0, 222.0, 384.0, 589.0, 1095.0, 2034.0, 3968.0, 8315.0, 18804.0, 47345.0, 128569.0, 343049.0, 308623.0, 111536.0, 41322.0, 16861.0, 7442.0, 3724.0, 1812.0, 973.0, 539.0, 331.0, 237.0, 114.0, 93.0, 46.0, 33.0, 25.0, 19.0, 14.0, 7.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1553955078125, -0.15037155151367188, -0.14534759521484375, -0.14032363891601562, -0.1352996826171875, -0.13027572631835938, -0.12525177001953125, -0.12022781372070312, -0.115203857421875, -0.11017990112304688, -0.10515594482421875, -0.10013198852539062, -0.0951080322265625, -0.09008407592773438, -0.08506011962890625, -0.08003616333007812, -0.07501220703125, -0.06998825073242188, -0.06496429443359375, -0.059940338134765625, -0.0549163818359375, -0.049892425537109375, -0.04486846923828125, -0.039844512939453125, -0.034820556640625, -0.029796600341796875, -0.02477264404296875, -0.019748687744140625, -0.0147247314453125, -0.009700775146484375, -0.00467681884765625, 0.000347137451171875, 0.00537109375, 0.010395050048828125, 0.01541900634765625, 0.020442962646484375, 0.0254669189453125, 0.030490875244140625, 0.03551483154296875, 0.040538787841796875, 0.045562744140625, 0.050586700439453125, 0.05561065673828125, 0.060634613037109375, 0.0656585693359375, 0.07068252563476562, 0.07570648193359375, 0.08073043823242188, 0.08575439453125, 0.09077835083007812, 0.09580230712890625, 0.10082626342773438, 0.1058502197265625, 0.11087417602539062, 0.11589813232421875, 0.12092208862304688, 0.125946044921875, 0.13097000122070312, 0.13599395751953125, 0.14101791381835938, 0.1460418701171875, 0.15106582641601562, 0.15608978271484375, 0.16111373901367188, 0.1661376953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 24.0, 17.0, 31.0, 41.0, 57.0, 71.0, 99.0, 105.0, 90.0, 81.0, 74.0, 66.0, 56.0, 50.0, 39.0, 22.0, 18.0, 10.0, 14.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17268753051757812, -0.16641998291015625, -0.16015243530273438, -0.1538848876953125, -0.14761734008789062, -0.14134979248046875, -0.13508224487304688, -0.128814697265625, -0.12254714965820312, -0.11627960205078125, -0.11001205444335938, -0.1037445068359375, -0.09747695922851562, -0.09120941162109375, -0.08494186401367188, -0.07867431640625, -0.07240676879882812, -0.06613922119140625, -0.059871673583984375, -0.0536041259765625, -0.047336578369140625, -0.04106903076171875, -0.034801483154296875, -0.028533935546875, -0.022266387939453125, -0.01599884033203125, -0.009731292724609375, -0.0034637451171875, 0.002803802490234375, 0.00907135009765625, 0.015338897705078125, 0.0216064453125, 0.027873992919921875, 0.03414154052734375, 0.040409088134765625, 0.0466766357421875, 0.052944183349609375, 0.05921173095703125, 0.06547927856445312, 0.071746826171875, 0.07801437377929688, 0.08428192138671875, 0.09054946899414062, 0.0968170166015625, 0.10308456420898438, 0.10935211181640625, 0.11561965942382812, 0.12188720703125, 0.12815475463867188, 0.13442230224609375, 0.14068984985351562, 0.1469573974609375, 0.15322494506835938, 0.15949249267578125, 0.16576004028320312, 0.172027587890625, 0.17829513549804688, 0.18456268310546875, 0.19083023071289062, 0.1970977783203125, 0.20336532592773438, 0.20963287353515625, 0.21590042114257812, 0.22216796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 5.0, 6.0, 16.0, 20.0, 25.0, 37.0, 71.0, 133.0, 243.0, 416.0, 757.0, 1864.0, 7165.0, 100265.0, 867009.0, 61758.0, 5573.0, 1626.0, 689.0, 343.0, 177.0, 117.0, 84.0, 47.0, 37.0, 21.0, 8.0, 6.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394287109375, -0.3787803649902344, -0.36327362060546875, -0.3477668762207031, -0.3322601318359375, -0.3167533874511719, -0.30124664306640625, -0.2857398986816406, -0.270233154296875, -0.2547264099121094, -0.23921966552734375, -0.22371292114257812, -0.2082061767578125, -0.19269943237304688, -0.17719268798828125, -0.16168594360351562, -0.14617919921875, -0.13067245483398438, -0.11516571044921875, -0.09965896606445312, -0.0841522216796875, -0.06864547729492188, -0.05313873291015625, -0.037631988525390625, -0.022125244140625, -0.006618499755859375, 0.00888824462890625, 0.024394989013671875, 0.0399017333984375, 0.055408477783203125, 0.07091522216796875, 0.08642196655273438, 0.1019287109375, 0.11743545532226562, 0.13294219970703125, 0.14844894409179688, 0.1639556884765625, 0.17946243286132812, 0.19496917724609375, 0.21047592163085938, 0.225982666015625, 0.24148941040039062, 0.25699615478515625, 0.2725028991699219, 0.2880096435546875, 0.3035163879394531, 0.31902313232421875, 0.3345298767089844, 0.35003662109375, 0.3655433654785156, 0.38105010986328125, 0.3965568542480469, 0.4120635986328125, 0.4275703430175781, 0.44307708740234375, 0.4585838317871094, 0.474090576171875, 0.4895973205566406, 0.5051040649414062, 0.5206108093261719, 0.5361175537109375, 0.5516242980957031, 0.5671310424804688, 0.5826377868652344, 0.59814453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 3.0, 10.0, 11.0, 7.0, 8.0, 17.0, 14.0, 19.0, 25.0, 26.0, 23.0, 13.0, 36.0, 29.0, 38.0, 39.0, 44.0, 39.0, 46.0, 34.0, 42.0, 47.0, 42.0, 32.0, 38.0, 28.0, 37.0, 29.0, 32.0, 28.0, 27.0, 16.0, 30.0, 16.0, 14.0, 15.0, 14.0, 4.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.369384765625, -0.35717010498046875, -0.3449554443359375, -0.33274078369140625, -0.320526123046875, -0.30831146240234375, -0.2960968017578125, -0.28388214111328125, -0.27166748046875, -0.25945281982421875, -0.2472381591796875, -0.23502349853515625, -0.222808837890625, -0.21059417724609375, -0.1983795166015625, -0.18616485595703125, -0.1739501953125, -0.16173553466796875, -0.1495208740234375, -0.13730621337890625, -0.125091552734375, -0.11287689208984375, -0.1006622314453125, -0.08844757080078125, -0.07623291015625, -0.06401824951171875, -0.0518035888671875, -0.03958892822265625, -0.027374267578125, -0.01515960693359375, -0.0029449462890625, 0.00926971435546875, 0.021484375, 0.03369903564453125, 0.0459136962890625, 0.05812835693359375, 0.070343017578125, 0.08255767822265625, 0.0947723388671875, 0.10698699951171875, 0.11920166015625, 0.13141632080078125, 0.1436309814453125, 0.15584564208984375, 0.168060302734375, 0.18027496337890625, 0.1924896240234375, 0.20470428466796875, 0.2169189453125, 0.22913360595703125, 0.2413482666015625, 0.25356292724609375, 0.265777587890625, 0.27799224853515625, 0.2902069091796875, 0.30242156982421875, 0.31463623046875, 0.32685089111328125, 0.3390655517578125, 0.35128021240234375, 0.363494873046875, 0.37570953369140625, 0.3879241943359375, 0.40013885498046875, 0.412353515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 17.0, 19.0, 23.0, 46.0, 65.0, 117.0, 200.0, 355.0, 703.0, 1683.0, 5502.0, 27742.0, 341560.0, 622463.0, 37517.0, 6842.0, 1985.0, 768.0, 380.0, 192.0, 120.0, 61.0, 53.0, 31.0, 24.0, 16.0, 12.0, 11.0, 10.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1320629119873047, -0.12679672241210938, -0.12153053283691406, -0.11626434326171875, -0.11099815368652344, -0.10573196411132812, -0.10046577453613281, -0.0951995849609375, -0.08993339538574219, -0.08466720581054688, -0.07940101623535156, -0.07413482666015625, -0.06886863708496094, -0.06360244750976562, -0.05833625793457031, -0.053070068359375, -0.04780387878417969, -0.042537689208984375, -0.03727149963378906, -0.03200531005859375, -0.026739120483398438, -0.021472930908203125, -0.016206741333007812, -0.0109405517578125, -0.0056743621826171875, -0.000408172607421875, 0.0048580169677734375, 0.01012420654296875, 0.015390396118164062, 0.020656585693359375, 0.025922775268554688, 0.03118896484375, 0.03645515441894531, 0.041721343994140625, 0.04698753356933594, 0.05225372314453125, 0.05751991271972656, 0.06278610229492188, 0.06805229187011719, 0.0733184814453125, 0.07858467102050781, 0.08385086059570312, 0.08911705017089844, 0.09438323974609375, 0.09964942932128906, 0.10491561889648438, 0.11018180847167969, 0.115447998046875, 0.12071418762207031, 0.12598037719726562, 0.13124656677246094, 0.13651275634765625, 0.14177894592285156, 0.14704513549804688, 0.1523113250732422, 0.1575775146484375, 0.1628437042236328, 0.16810989379882812, 0.17337608337402344, 0.17864227294921875, 0.18390846252441406, 0.18917465209960938, 0.1944408416748047, 0.19970703125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 13.0, 22.0, 26.0, 24.0, 48.0, 52.0, 96.0, 133.0, 140.0, 115.0, 83.0, 45.0, 21.0, 21.0, 23.0, 15.0, 15.0, 16.0, 7.0, 8.0, 6.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56382942199707e-05, -7.321685552597046e-05, -7.079541683197021e-05, -6.837397813796997e-05, -6.595253944396973e-05, -6.353110074996948e-05, -6.110966205596924e-05, -5.8688223361968994e-05, -5.626678466796875e-05, -5.3845345973968506e-05, -5.142390727996826e-05, -4.900246858596802e-05, -4.6581029891967773e-05, -4.415959119796753e-05, -4.1738152503967285e-05, -3.931671380996704e-05, -3.68952751159668e-05, -3.447383642196655e-05, -3.205239772796631e-05, -2.9630959033966064e-05, -2.720952033996582e-05, -2.4788081645965576e-05, -2.2366642951965332e-05, -1.9945204257965088e-05, -1.7523765563964844e-05, -1.51023268699646e-05, -1.2680888175964355e-05, -1.0259449481964111e-05, -7.838010787963867e-06, -5.416572093963623e-06, -2.995133399963379e-06, -5.736947059631348e-07, 1.8477439880371094e-06, 4.2691826820373535e-06, 6.690621376037598e-06, 9.112060070037842e-06, 1.1533498764038086e-05, 1.395493745803833e-05, 1.6376376152038574e-05, 1.879781484603882e-05, 2.1219253540039062e-05, 2.3640692234039307e-05, 2.606213092803955e-05, 2.8483569622039795e-05, 3.090500831604004e-05, 3.332644701004028e-05, 3.574788570404053e-05, 3.816932439804077e-05, 4.0590763092041016e-05, 4.301220178604126e-05, 4.5433640480041504e-05, 4.785507917404175e-05, 5.027651786804199e-05, 5.2697956562042236e-05, 5.511939525604248e-05, 5.7540833950042725e-05, 5.996227264404297e-05, 6.238371133804321e-05, 6.480515003204346e-05, 6.72265887260437e-05, 6.964802742004395e-05, 7.206946611404419e-05, 7.449090480804443e-05, 7.691234350204468e-05, 7.933378219604492e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 10.0, 16.0, 9.0, 31.0, 46.0, 69.0, 124.0, 184.0, 357.0, 672.0, 1428.0, 4067.0, 17987.0, 165732.0, 783128.0, 60329.0, 9501.0, 2652.0, 1010.0, 458.0, 310.0, 160.0, 94.0, 69.0, 25.0, 32.0, 18.0, 8.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23584747314453125, -0.2299957275390625, -0.22414398193359375, -0.218292236328125, -0.21244049072265625, -0.2065887451171875, -0.20073699951171875, -0.19488525390625, -0.18903350830078125, -0.1831817626953125, -0.17733001708984375, -0.171478271484375, -0.16562652587890625, -0.1597747802734375, -0.15392303466796875, -0.1480712890625, -0.14221954345703125, -0.1363677978515625, -0.13051605224609375, -0.124664306640625, -0.11881256103515625, -0.1129608154296875, -0.10710906982421875, -0.10125732421875, -0.09540557861328125, -0.0895538330078125, -0.08370208740234375, -0.077850341796875, -0.07199859619140625, -0.0661468505859375, -0.06029510498046875, -0.054443359375, -0.04859161376953125, -0.0427398681640625, -0.03688812255859375, -0.031036376953125, -0.02518463134765625, -0.0193328857421875, -0.01348114013671875, -0.00762939453125, -0.00177764892578125, 0.0040740966796875, 0.00992584228515625, 0.015777587890625, 0.02162933349609375, 0.0274810791015625, 0.03333282470703125, 0.0391845703125, 0.04503631591796875, 0.0508880615234375, 0.05673980712890625, 0.062591552734375, 0.06844329833984375, 0.0742950439453125, 0.08014678955078125, 0.08599853515625, 0.09185028076171875, 0.0977020263671875, 0.10355377197265625, 0.109405517578125, 0.11525726318359375, 0.1211090087890625, 0.12696075439453125, 0.1328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 4.0, 7.0, 10.0, 14.0, 10.0, 24.0, 18.0, 17.0, 22.0, 38.0, 38.0, 43.0, 53.0, 44.0, 55.0, 66.0, 67.0, 60.0, 56.0, 50.0, 50.0, 40.0, 39.0, 29.0, 14.0, 21.0, 14.0, 4.0, 9.0, 6.0, 6.0, 12.0, 6.0, 5.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08203125, -0.0791788101196289, -0.07632637023925781, -0.07347393035888672, -0.07062149047851562, -0.06776905059814453, -0.06491661071777344, -0.062064170837402344, -0.05921173095703125, -0.056359291076660156, -0.05350685119628906, -0.05065441131591797, -0.047801971435546875, -0.04494953155517578, -0.04209709167480469, -0.039244651794433594, -0.0363922119140625, -0.033539772033691406, -0.030687332153320312, -0.02783489227294922, -0.024982452392578125, -0.02213001251220703, -0.019277572631835938, -0.016425132751464844, -0.01357269287109375, -0.010720252990722656, -0.007867813110351562, -0.005015373229980469, -0.002162933349609375, 0.0006895065307617188, 0.0035419464111328125, 0.006394386291503906, 0.009246826171875, 0.012099266052246094, 0.014951705932617188, 0.01780414581298828, 0.020656585693359375, 0.02350902557373047, 0.026361465454101562, 0.029213905334472656, 0.03206634521484375, 0.034918785095214844, 0.03777122497558594, 0.04062366485595703, 0.043476104736328125, 0.04632854461669922, 0.04918098449707031, 0.052033424377441406, 0.0548858642578125, 0.057738304138183594, 0.06059074401855469, 0.06344318389892578, 0.06629562377929688, 0.06914806365966797, 0.07200050354003906, 0.07485294342041016, 0.07770538330078125, 0.08055782318115234, 0.08341026306152344, 0.08626270294189453, 0.08911514282226562, 0.09196758270263672, 0.09482002258300781, 0.0976724624633789, 0.10052490234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 21.0, 95.0, 283.0, 367.0, 164.0, 44.0, 15.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109798908233643, -4.955634593963623, -4.8014702796936035, -4.647306442260742, -4.493142127990723, -4.338977813720703, -4.184813499450684, -4.030649185180664, -3.8764853477478027, -3.722321033477783, -3.5681569576263428, -3.4139926433563232, -3.259828567504883, -3.1056642532348633, -2.9514999389648438, -2.7973358631134033, -2.643171548843384, -2.4890072345733643, -2.334843158721924, -2.1806788444519043, -2.026514768600464, -1.8723504543304443, -1.7181862592697144, -1.5640220642089844, -1.4098578691482544, -1.2556936740875244, -1.1015294790267944, -0.9473652243614197, -0.7932010293006897, -0.6390368342399597, -0.48487257957458496, -0.330708384513855, -0.176544189453125, -0.022379979491233826, 0.13178423047065735, 0.2859484553337097, 0.4401126503944397, 0.5942768454551697, 0.7484411001205444, 0.9026052951812744, 1.0567694902420044, 1.2109336853027344, 1.3650978803634644, 1.5192620754241943, 1.6734263896942139, 1.8275904655456543, 1.9817547798156738, 2.1359190940856934, 2.290083169937134, 2.4442474842071533, 2.5984115600585938, 2.7525758743286133, 2.9067399501800537, 3.0609042644500732, 3.2150683403015137, 3.369232654571533, 3.5233969688415527, 3.6775612831115723, 3.8317253589630127, 3.9858896732330322, 4.140053749084473, 4.294218063354492, 4.448382377624512, 4.602546691894531, 4.756710529327393]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 9.0, 16.0, 12.0, 12.0, 10.0, 18.0, 25.0, 17.0, 31.0, 22.0, 29.0, 28.0, 25.0, 35.0, 30.0, 44.0, 53.0, 41.0, 37.0, 48.0, 46.0, 34.0, 35.0, 41.0, 32.0, 30.0, 32.0, 31.0, 22.0, 12.0, 29.0, 13.0, 15.0, 10.0, 17.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-1.4520676136016846, -1.4080214500427246, -1.3639752864837646, -1.3199291229248047, -1.2758829593658447, -1.2318367958068848, -1.1877906322479248, -1.1437444686889648, -1.0996983051300049, -1.055652141571045, -1.011605978012085, -0.967559814453125, -0.923513650894165, -0.8794674873352051, -0.8354212641716003, -0.7913751006126404, -0.7473288774490356, -0.7032827138900757, -0.6592365503311157, -0.6151903867721558, -0.5711442232131958, -0.5270980596542358, -0.4830518364906311, -0.43900567293167114, -0.3949595093727112, -0.3509133458137512, -0.30686718225479126, -0.2628209888935089, -0.21877482533454895, -0.174728661775589, -0.13068246841430664, -0.08663630485534668, -0.04259002208709717, 0.00145614892244339, 0.04550231993198395, 0.0895484983921051, 0.13359466195106506, 0.17764082551002502, 0.22168701887130737, 0.26573318243026733, 0.3097793459892273, 0.35382550954818726, 0.3978716731071472, 0.44191786646842957, 0.4859640300273895, 0.5300102233886719, 0.5740563869476318, 0.6181025505065918, 0.6621487140655518, 0.7061948776245117, 0.7502410411834717, 0.7942872047424316, 0.8383333683013916, 0.8823795318603516, 0.9264257550239563, 0.9704719185829163, 1.0145180225372314, 1.0585641860961914, 1.1026103496551514, 1.1466565132141113, 1.1907026767730713, 1.2347488403320312, 1.2787950038909912, 1.3228411674499512, 1.3668874502182007]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 6.0, 6.0, 10.0, 23.0, 21.0, 43.0, 60.0, 99.0, 138.0, 220.0, 418.0, 2251.0, 2331242.0, 1856715.0, 2007.0, 409.0, 201.0, 137.0, 90.0, 59.0, 37.0, 31.0, 21.0, 13.0, 3.0, 5.0, 2.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.080078125, -1.0508804321289062, -1.0216827392578125, -0.9924850463867188, -0.963287353515625, -0.9340896606445312, -0.9048919677734375, -0.8756942749023438, -0.84649658203125, -0.8172988891601562, -0.7881011962890625, -0.7589035034179688, -0.729705810546875, -0.7005081176757812, -0.6713104248046875, -0.6421127319335938, -0.6129150390625, -0.5837173461914062, -0.5545196533203125, -0.5253219604492188, -0.496124267578125, -0.46692657470703125, -0.4377288818359375, -0.40853118896484375, -0.37933349609375, -0.35013580322265625, -0.3209381103515625, -0.29174041748046875, -0.262542724609375, -0.23334503173828125, -0.2041473388671875, -0.17494964599609375, -0.145751953125, -0.11655426025390625, -0.0873565673828125, -0.05815887451171875, -0.028961181640625, 0.00023651123046875, 0.0294342041015625, 0.05863189697265625, 0.08782958984375, 0.11702728271484375, 0.1462249755859375, 0.17542266845703125, 0.204620361328125, 0.23381805419921875, 0.2630157470703125, 0.29221343994140625, 0.3214111328125, 0.35060882568359375, 0.3798065185546875, 0.40900421142578125, 0.438201904296875, 0.46739959716796875, 0.4965972900390625, 0.5257949829101562, 0.55499267578125, 0.5841903686523438, 0.6133880615234375, 0.6425857543945312, 0.671783447265625, 0.7009811401367188, 0.7301788330078125, 0.7593765258789062, 0.78857421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 15.0, 25.0, 36.0, 45.0, 58.0, 76.0, 100.0, 96.0, 107.0, 82.0, 79.0, 61.0, 61.0, 43.0, 27.0, 20.0, 21.0, 9.0, 12.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1645183563232422, -0.15826034545898438, -0.15200233459472656, -0.14574432373046875, -0.13948631286621094, -0.13322830200195312, -0.1269702911376953, -0.1207122802734375, -0.11445426940917969, -0.10819625854492188, -0.10193824768066406, -0.09568023681640625, -0.08942222595214844, -0.08316421508789062, -0.07690620422363281, -0.070648193359375, -0.06439018249511719, -0.058132171630859375, -0.05187416076660156, -0.04561614990234375, -0.03935813903808594, -0.033100128173828125, -0.026842117309570312, -0.0205841064453125, -0.014326095581054688, -0.008068084716796875, -0.0018100738525390625, 0.00444793701171875, 0.010705947875976562, 0.016963958740234375, 0.023221969604492188, 0.02947998046875, 0.03573799133300781, 0.041996002197265625, 0.04825401306152344, 0.05451202392578125, 0.06077003479003906, 0.06702804565429688, 0.07328605651855469, 0.0795440673828125, 0.08580207824707031, 0.09206008911132812, 0.09831809997558594, 0.10457611083984375, 0.11083412170410156, 0.11709213256835938, 0.12335014343261719, 0.129608154296875, 0.1358661651611328, 0.14212417602539062, 0.14838218688964844, 0.15464019775390625, 0.16089820861816406, 0.16715621948242188, 0.1734142303466797, 0.1796722412109375, 0.1859302520751953, 0.19218826293945312, 0.19844627380371094, 0.20470428466796875, 0.21096229553222656, 0.21722030639648438, 0.2234783172607422, 0.229736328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 21.0, 38.0, 91.0, 112.0, 263.0, 523.0, 1149.0, 2863.0, 9673.0, 58946.0, 2097616.0, 1955010.0, 54844.0, 8725.0, 2455.0, 918.0, 445.0, 245.0, 120.0, 97.0, 49.0, 29.0, 11.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.25146484375, -0.24308013916015625, -0.2346954345703125, -0.22631072998046875, -0.217926025390625, -0.20954132080078125, -0.2011566162109375, -0.19277191162109375, -0.18438720703125, -0.17600250244140625, -0.1676177978515625, -0.15923309326171875, -0.150848388671875, -0.14246368408203125, -0.1340789794921875, -0.12569427490234375, -0.1173095703125, -0.10892486572265625, -0.1005401611328125, -0.09215545654296875, -0.083770751953125, -0.07538604736328125, -0.0670013427734375, -0.05861663818359375, -0.05023193359375, -0.04184722900390625, -0.0334625244140625, -0.02507781982421875, -0.016693115234375, -0.00830841064453125, 7.62939453125e-05, 0.00846099853515625, 0.016845703125, 0.02523040771484375, 0.0336151123046875, 0.04199981689453125, 0.050384521484375, 0.05876922607421875, 0.0671539306640625, 0.07553863525390625, 0.08392333984375, 0.09230804443359375, 0.1006927490234375, 0.10907745361328125, 0.117462158203125, 0.12584686279296875, 0.1342315673828125, 0.14261627197265625, 0.1510009765625, 0.15938568115234375, 0.1677703857421875, 0.17615509033203125, 0.184539794921875, 0.19292449951171875, 0.2013092041015625, 0.20969390869140625, 0.21807861328125, 0.22646331787109375, 0.2348480224609375, 0.24323272705078125, 0.251617431640625, 0.26000213623046875, 0.2683868408203125, 0.27677154541015625, 0.28515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 8.0, 5.0, 10.0, 8.0, 13.0, 23.0, 35.0, 42.0, 73.0, 153.0, 311.0, 577.0, 907.0, 845.0, 502.0, 253.0, 134.0, 58.0, 45.0, 23.0, 15.0, 9.0, 7.0, 8.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.225830078125, -0.21850967407226562, -0.21118927001953125, -0.20386886596679688, -0.1965484619140625, -0.18922805786132812, -0.18190765380859375, -0.17458724975585938, -0.167266845703125, -0.15994644165039062, -0.15262603759765625, -0.14530563354492188, -0.1379852294921875, -0.13066482543945312, -0.12334442138671875, -0.11602401733398438, -0.10870361328125, -0.10138320922851562, -0.09406280517578125, -0.08674240112304688, -0.0794219970703125, -0.07210159301757812, -0.06478118896484375, -0.057460784912109375, -0.050140380859375, -0.042819976806640625, -0.03549957275390625, -0.028179168701171875, -0.0208587646484375, -0.013538360595703125, -0.00621795654296875, 0.001102447509765625, 0.0084228515625, 0.015743255615234375, 0.02306365966796875, 0.030384063720703125, 0.0377044677734375, 0.045024871826171875, 0.05234527587890625, 0.059665679931640625, 0.066986083984375, 0.07430648803710938, 0.08162689208984375, 0.08894729614257812, 0.0962677001953125, 0.10358810424804688, 0.11090850830078125, 0.11822891235351562, 0.12554931640625, 0.13286972045898438, 0.14019012451171875, 0.14751052856445312, 0.1548309326171875, 0.16215133666992188, 0.16947174072265625, 0.17679214477539062, 0.184112548828125, 0.19143295288085938, 0.19875335693359375, 0.20607376098632812, 0.2133941650390625, 0.22071456909179688, 0.22803497314453125, 0.23535537719726562, 0.24267578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 20.0, 36.0, 74.0, 129.0, 189.0, 200.0, 163.0, 62.0, 44.0, 30.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1887683868408203, -2.1335010528564453, -2.0782337188720703, -2.0229663848876953, -1.9676991701126099, -1.9124318361282349, -1.8571646213531494, -1.8018972873687744, -1.7466299533843994, -1.6913626194000244, -1.6360952854156494, -1.580828070640564, -1.525560736656189, -1.470293402671814, -1.4150261878967285, -1.3597588539123535, -1.3044915199279785, -1.2492241859436035, -1.1939568519592285, -1.138689637184143, -1.083422303199768, -1.028154969215393, -0.9728876948356628, -0.9176204204559326, -0.8623530864715576, -0.8070857524871826, -0.7518184781074524, -0.6965512037277222, -0.6412838697433472, -0.5860165357589722, -0.5307492613792419, -0.47548195719718933, -0.4202146530151367, -0.3649473488330841, -0.3096800446510315, -0.2544127404689789, -0.19914543628692627, -0.14387813210487366, -0.08861082792282104, -0.03334352374076843, 0.02192378044128418, 0.07719108462333679, 0.1324583888053894, 0.18772569298744202, 0.24299299716949463, 0.29826030135154724, 0.35352760553359985, 0.40879490971565247, 0.4640622138977051, 0.5193295478820801, 0.5745968222618103, 0.6298640966415405, 0.6851314306259155, 0.7403987646102905, 0.7956660389900208, 0.850933313369751, 0.906200647354126, 0.961467981338501, 1.016735315322876, 1.0720025300979614, 1.1272698640823364, 1.1825371980667114, 1.2378044128417969, 1.2930717468261719, 1.3483390808105469]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 10.0, 11.0, 17.0, 17.0, 27.0, 33.0, 31.0, 41.0, 47.0, 46.0, 63.0, 70.0, 60.0, 65.0, 53.0, 49.0, 59.0, 47.0, 43.0, 44.0, 31.0, 21.0, 20.0, 19.0, 14.0, 17.0, 7.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9478108882904053, -0.9135656356811523, -0.8793204426765442, -0.8450751900672913, -0.8108299970626831, -0.7765847444534302, -0.7423394918441772, -0.7080942392349243, -0.6738490462303162, -0.6396037936210632, -0.6053586006164551, -0.5711133480072021, -0.5368680953979492, -0.5026229023933411, -0.46837764978408813, -0.4341324269771576, -0.39988720417022705, -0.3656419813632965, -0.33139675855636597, -0.29715150594711304, -0.2629062831401825, -0.22866106033325195, -0.19441582262516022, -0.16017058491706848, -0.12592536211013794, -0.0916801318526268, -0.05743490159511566, -0.023189671337604523, 0.011055558919906616, 0.04530078172683716, 0.0795460194349289, 0.11379125714302063, 0.14803647994995117, 0.1822817027568817, 0.21652694046497345, 0.2507721781730652, 0.2850174009799957, 0.31926262378692627, 0.3535078763961792, 0.38775309920310974, 0.4219983220100403, 0.4562435448169708, 0.49048876762390137, 0.5247340202331543, 0.5589792728424072, 0.5932244658470154, 0.6274697184562683, 0.6617149114608765, 0.6959601640701294, 0.7302054166793823, 0.7644506096839905, 0.7986958622932434, 0.8329410552978516, 0.8671863079071045, 0.9014315605163574, 0.9356768131256104, 0.9699220061302185, 1.0041671991348267, 1.0384124517440796, 1.0726577043533325, 1.1069029569625854, 1.1411480903625488, 1.1753933429718018, 1.2096385955810547, 1.2438838481903076]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 7.0, 8.0, 11.0, 24.0, 21.0, 49.0, 80.0, 94.0, 151.0, 234.0, 419.0, 657.0, 1094.0, 2025.0, 4075.0, 8324.0, 18741.0, 45834.0, 130911.0, 380079.0, 296129.0, 95531.0, 35093.0, 14913.0, 6721.0, 3214.0, 1692.0, 914.0, 521.0, 380.0, 228.0, 127.0, 94.0, 48.0, 49.0, 20.0, 18.0, 4.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146240234375, -0.1411724090576172, -0.13610458374023438, -0.13103675842285156, -0.12596893310546875, -0.12090110778808594, -0.11583328247070312, -0.11076545715332031, -0.1056976318359375, -0.10062980651855469, -0.09556198120117188, -0.09049415588378906, -0.08542633056640625, -0.08035850524902344, -0.07529067993164062, -0.07022285461425781, -0.065155029296875, -0.06008720397949219, -0.055019378662109375, -0.04995155334472656, -0.04488372802734375, -0.03981590270996094, -0.034748077392578125, -0.029680252075195312, -0.0246124267578125, -0.019544601440429688, -0.014476776123046875, -0.009408950805664062, -0.00434112548828125, 0.0007266998291015625, 0.005794525146484375, 0.010862350463867188, 0.01593017578125, 0.020998001098632812, 0.026065826416015625, 0.031133651733398438, 0.03620147705078125, 0.04126930236816406, 0.046337127685546875, 0.05140495300292969, 0.0564727783203125, 0.06154060363769531, 0.06660842895507812, 0.07167625427246094, 0.07674407958984375, 0.08181190490722656, 0.08687973022460938, 0.09194755554199219, 0.097015380859375, 0.10208320617675781, 0.10715103149414062, 0.11221885681152344, 0.11728668212890625, 0.12235450744628906, 0.12742233276367188, 0.1324901580810547, 0.1375579833984375, 0.1426258087158203, 0.14769363403320312, 0.15276145935058594, 0.15782928466796875, 0.16289710998535156, 0.16796493530273438, 0.1730327606201172, 0.1781005859375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 13.0, 17.0, 22.0, 41.0, 43.0, 49.0, 85.0, 71.0, 89.0, 89.0, 97.0, 81.0, 63.0, 46.0, 49.0, 33.0, 28.0, 20.0, 11.0, 10.0, 15.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1656494140625, -0.15985107421875, -0.154052734375, -0.14825439453125, -0.1424560546875, -0.13665771484375, -0.130859375, -0.12506103515625, -0.1192626953125, -0.11346435546875, -0.107666015625, -0.10186767578125, -0.0960693359375, -0.09027099609375, -0.08447265625, -0.07867431640625, -0.0728759765625, -0.06707763671875, -0.061279296875, -0.05548095703125, -0.0496826171875, -0.04388427734375, -0.0380859375, -0.03228759765625, -0.0264892578125, -0.02069091796875, -0.014892578125, -0.00909423828125, -0.0032958984375, 0.00250244140625, 0.00830078125, 0.01409912109375, 0.0198974609375, 0.02569580078125, 0.031494140625, 0.03729248046875, 0.0430908203125, 0.04888916015625, 0.0546875, 0.06048583984375, 0.0662841796875, 0.07208251953125, 0.077880859375, 0.08367919921875, 0.0894775390625, 0.09527587890625, 0.10107421875, 0.10687255859375, 0.1126708984375, 0.11846923828125, 0.124267578125, 0.13006591796875, 0.1358642578125, 0.14166259765625, 0.1474609375, 0.15325927734375, 0.1590576171875, 0.16485595703125, 0.170654296875, 0.17645263671875, 0.1822509765625, 0.18804931640625, 0.19384765625, 0.19964599609375, 0.2054443359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 17.0, 19.0, 27.0, 35.0, 86.0, 170.0, 401.0, 1090.0, 4746.0, 56402.0, 891410.0, 85843.0, 6160.0, 1302.0, 439.0, 165.0, 100.0, 51.0, 19.0, 22.0, 14.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.46915435791015625, -0.4514923095703125, -0.43383026123046875, -0.416168212890625, -0.39850616455078125, -0.3808441162109375, -0.36318206787109375, -0.34552001953125, -0.32785797119140625, -0.3101959228515625, -0.29253387451171875, -0.274871826171875, -0.25720977783203125, -0.2395477294921875, -0.22188568115234375, -0.2042236328125, -0.18656158447265625, -0.1688995361328125, -0.15123748779296875, -0.133575439453125, -0.11591339111328125, -0.0982513427734375, -0.08058929443359375, -0.06292724609375, -0.04526519775390625, -0.0276031494140625, -0.00994110107421875, 0.007720947265625, 0.02538299560546875, 0.0430450439453125, 0.06070709228515625, 0.078369140625, 0.09603118896484375, 0.1136932373046875, 0.13135528564453125, 0.149017333984375, 0.16667938232421875, 0.1843414306640625, 0.20200347900390625, 0.21966552734375, 0.23732757568359375, 0.2549896240234375, 0.27265167236328125, 0.290313720703125, 0.30797576904296875, 0.3256378173828125, 0.34329986572265625, 0.3609619140625, 0.37862396240234375, 0.3962860107421875, 0.41394805908203125, 0.431610107421875, 0.44927215576171875, 0.4669342041015625, 0.48459625244140625, 0.50225830078125, 0.5199203491210938, 0.5375823974609375, 0.5552444458007812, 0.572906494140625, 0.5905685424804688, 0.6082305908203125, 0.6258926391601562, 0.6435546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 13.0, 15.0, 21.0, 20.0, 23.0, 27.0, 43.0, 51.0, 47.0, 54.0, 50.0, 76.0, 58.0, 66.0, 63.0, 47.0, 49.0, 54.0, 38.0, 35.0, 23.0, 18.0, 26.0, 17.0, 10.0, 6.0, 10.0, 14.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5442581176757812, -0.5279693603515625, -0.5116806030273438, -0.495391845703125, -0.47910308837890625, -0.4628143310546875, -0.44652557373046875, -0.43023681640625, -0.41394805908203125, -0.3976593017578125, -0.38137054443359375, -0.365081787109375, -0.34879302978515625, -0.3325042724609375, -0.31621551513671875, -0.2999267578125, -0.28363800048828125, -0.2673492431640625, -0.25106048583984375, -0.234771728515625, -0.21848297119140625, -0.2021942138671875, -0.18590545654296875, -0.16961669921875, -0.15332794189453125, -0.1370391845703125, -0.12075042724609375, -0.104461669921875, -0.08817291259765625, -0.0718841552734375, -0.05559539794921875, -0.039306640625, -0.02301788330078125, -0.0067291259765625, 0.00955963134765625, 0.025848388671875, 0.04213714599609375, 0.0584259033203125, 0.07471466064453125, 0.09100341796875, 0.10729217529296875, 0.1235809326171875, 0.13986968994140625, 0.156158447265625, 0.17244720458984375, 0.1887359619140625, 0.20502471923828125, 0.2213134765625, 0.23760223388671875, 0.2538909912109375, 0.27017974853515625, 0.286468505859375, 0.30275726318359375, 0.3190460205078125, 0.33533477783203125, 0.35162353515625, 0.36791229248046875, 0.3842010498046875, 0.40048980712890625, 0.416778564453125, 0.43306732177734375, 0.4493560791015625, 0.46564483642578125, 0.48193359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 6.0, 26.0, 14.0, 38.0, 77.0, 136.0, 319.0, 1024.0, 4496.0, 49387.0, 893579.0, 90898.0, 6528.0, 1226.0, 389.0, 187.0, 87.0, 43.0, 25.0, 15.0, 11.0, 12.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.286376953125, -0.2783317565917969, -0.27028656005859375, -0.2622413635253906, -0.2541961669921875, -0.24615097045898438, -0.23810577392578125, -0.23006057739257812, -0.222015380859375, -0.21397018432617188, -0.20592498779296875, -0.19787979125976562, -0.1898345947265625, -0.18178939819335938, -0.17374420166015625, -0.16569900512695312, -0.15765380859375, -0.14960861206054688, -0.14156341552734375, -0.13351821899414062, -0.1254730224609375, -0.11742782592773438, -0.10938262939453125, -0.10133743286132812, -0.093292236328125, -0.08524703979492188, -0.07720184326171875, -0.06915664672851562, -0.0611114501953125, -0.053066253662109375, -0.04502105712890625, -0.036975860595703125, -0.0289306640625, -0.020885467529296875, -0.01284027099609375, -0.004795074462890625, 0.0032501220703125, 0.011295318603515625, 0.01934051513671875, 0.027385711669921875, 0.035430908203125, 0.043476104736328125, 0.05152130126953125, 0.059566497802734375, 0.0676116943359375, 0.07565689086914062, 0.08370208740234375, 0.09174728393554688, 0.09979248046875, 0.10783767700195312, 0.11588287353515625, 0.12392807006835938, 0.1319732666015625, 0.14001846313476562, 0.14806365966796875, 0.15610885620117188, 0.164154052734375, 0.17219924926757812, 0.18024444580078125, 0.18828964233398438, 0.1963348388671875, 0.20438003540039062, 0.21242523193359375, 0.22047042846679688, 0.228515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 8.0, 15.0, 15.0, 26.0, 19.0, 43.0, 58.0, 92.0, 142.0, 148.0, 123.0, 94.0, 62.0, 47.0, 28.0, 18.0, 12.0, 11.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.316205978393555e-05, -9.061768651008606e-05, -8.807331323623657e-05, -8.552893996238708e-05, -8.29845666885376e-05, -8.044019341468811e-05, -7.789582014083862e-05, -7.535144686698914e-05, -7.280707359313965e-05, -7.026270031929016e-05, -6.771832704544067e-05, -6.517395377159119e-05, -6.26295804977417e-05, -6.008520722389221e-05, -5.7540833950042725e-05, -5.499646067619324e-05, -5.245208740234375e-05, -4.990771412849426e-05, -4.7363340854644775e-05, -4.481896758079529e-05, -4.22745943069458e-05, -3.9730221033096313e-05, -3.7185847759246826e-05, -3.464147448539734e-05, -3.209710121154785e-05, -2.9552727937698364e-05, -2.7008354663848877e-05, -2.446398138999939e-05, -2.1919608116149902e-05, -1.9375234842300415e-05, -1.6830861568450928e-05, -1.428648829460144e-05, -1.1742115020751953e-05, -9.197741746902466e-06, -6.6533684730529785e-06, -4.108995199203491e-06, -1.564621925354004e-06, 9.797513484954834e-07, 3.5241246223449707e-06, 6.068497896194458e-06, 8.612871170043945e-06, 1.1157244443893433e-05, 1.370161771774292e-05, 1.6245990991592407e-05, 1.8790364265441895e-05, 2.1334737539291382e-05, 2.387911081314087e-05, 2.6423484086990356e-05, 2.8967857360839844e-05, 3.151223063468933e-05, 3.405660390853882e-05, 3.6600977182388306e-05, 3.914535045623779e-05, 4.168972373008728e-05, 4.423409700393677e-05, 4.6778470277786255e-05, 4.932284355163574e-05, 5.186721682548523e-05, 5.441159009933472e-05, 5.6955963373184204e-05, 5.950033664703369e-05, 6.204470992088318e-05, 6.458908319473267e-05, 6.713345646858215e-05, 6.967782974243164e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 18.0, 26.0, 38.0, 47.0, 88.0, 159.0, 306.0, 563.0, 1382.0, 3990.0, 17310.0, 166090.0, 782866.0, 61911.0, 9281.0, 2499.0, 967.0, 443.0, 235.0, 109.0, 78.0, 54.0, 25.0, 21.0, 8.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17217636108398438, -0.16649627685546875, -0.16081619262695312, -0.1551361083984375, -0.14945602416992188, -0.14377593994140625, -0.13809585571289062, -0.132415771484375, -0.12673568725585938, -0.12105560302734375, -0.11537551879882812, -0.1096954345703125, -0.10401535034179688, -0.09833526611328125, -0.09265518188476562, -0.08697509765625, -0.08129501342773438, -0.07561492919921875, -0.06993484497070312, -0.0642547607421875, -0.058574676513671875, -0.05289459228515625, -0.047214508056640625, -0.041534423828125, -0.035854339599609375, -0.03017425537109375, -0.024494171142578125, -0.0188140869140625, -0.013134002685546875, -0.00745391845703125, -0.001773834228515625, 0.00390625, 0.009586334228515625, 0.01526641845703125, 0.020946502685546875, 0.0266265869140625, 0.032306671142578125, 0.03798675537109375, 0.043666839599609375, 0.049346923828125, 0.055027008056640625, 0.06070709228515625, 0.06638717651367188, 0.0720672607421875, 0.07774734497070312, 0.08342742919921875, 0.08910751342773438, 0.09478759765625, 0.10046768188476562, 0.10614776611328125, 0.11182785034179688, 0.1175079345703125, 0.12318801879882812, 0.12886810302734375, 0.13454818725585938, 0.140228271484375, 0.14590835571289062, 0.15158843994140625, 0.15726852416992188, 0.1629486083984375, 0.16862869262695312, 0.17430877685546875, 0.17998886108398438, 0.1856689453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 3.0, 4.0, 5.0, 9.0, 12.0, 20.0, 13.0, 13.0, 33.0, 41.0, 67.0, 84.0, 92.0, 127.0, 111.0, 94.0, 79.0, 53.0, 39.0, 23.0, 23.0, 18.0, 9.0, 10.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.143310546875, -0.13866043090820312, -0.13401031494140625, -0.12936019897460938, -0.1247100830078125, -0.12005996704101562, -0.11540985107421875, -0.11075973510742188, -0.106109619140625, -0.10145950317382812, -0.09680938720703125, -0.09215927124023438, -0.0875091552734375, -0.08285903930664062, -0.07820892333984375, -0.07355880737304688, -0.06890869140625, -0.06425857543945312, -0.05960845947265625, -0.054958343505859375, -0.0503082275390625, -0.045658111572265625, -0.04100799560546875, -0.036357879638671875, -0.031707763671875, -0.027057647705078125, -0.02240753173828125, -0.017757415771484375, -0.0131072998046875, -0.008457183837890625, -0.00380706787109375, 0.000843048095703125, 0.0054931640625, 0.010143280029296875, 0.01479339599609375, 0.019443511962890625, 0.0240936279296875, 0.028743743896484375, 0.03339385986328125, 0.038043975830078125, 0.042694091796875, 0.047344207763671875, 0.05199432373046875, 0.056644439697265625, 0.0612945556640625, 0.06594467163085938, 0.07059478759765625, 0.07524490356445312, 0.07989501953125, 0.08454513549804688, 0.08919525146484375, 0.09384536743164062, 0.0984954833984375, 0.10314559936523438, 0.10779571533203125, 0.11244583129882812, 0.117095947265625, 0.12174606323242188, 0.12639617919921875, 0.13104629516601562, 0.1356964111328125, 0.14034652709960938, 0.14499664306640625, 0.14964675903320312, 0.154296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 20.0, 66.0, 173.0, 365.0, 238.0, 78.0, 32.0, 10.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0597400665283203, -2.9184553623199463, -2.7771706581115723, -2.6358859539031982, -2.494601249694824, -2.35331654548645, -2.212031841278076, -2.070747137069702, -1.9294624328613281, -1.788177728652954, -1.64689302444458, -1.505608320236206, -1.364323616027832, -1.223038911819458, -1.081754207611084, -0.94046950340271, -0.7991847991943359, -0.6579000949859619, -0.5166153907775879, -0.37533068656921387, -0.23404598236083984, -0.09276127815246582, 0.0485234260559082, 0.18980813026428223, 0.33109283447265625, 0.4723775386810303, 0.6136622428894043, 0.7549469470977783, 0.8962316513061523, 1.0375163555145264, 1.1788010597229004, 1.3200857639312744, 1.4613704681396484, 1.6026551723480225, 1.7439398765563965, 1.8852245807647705, 2.0265092849731445, 2.1677939891815186, 2.3090786933898926, 2.4503633975982666, 2.5916481018066406, 2.7329328060150146, 2.8742175102233887, 3.0155022144317627, 3.1567869186401367, 3.2980716228485107, 3.4393563270568848, 3.580641031265259, 3.721925735473633, 3.863210439682007, 4.004495143890381, 4.145779609680176, 4.287064552307129, 4.428349494934082, 4.569633960723877, 4.710918426513672, 4.852203369140625, 4.993488311767578, 5.134772777557373, 5.276057243347168, 5.417342185974121, 5.558627128601074, 5.699911594390869, 5.841196060180664, 5.982481002807617]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 10.0, 7.0, 12.0, 13.0, 15.0, 10.0, 13.0, 23.0, 31.0, 32.0, 49.0, 43.0, 36.0, 52.0, 70.0, 81.0, 61.0, 67.0, 60.0, 34.0, 54.0, 38.0, 32.0, 31.0, 24.0, 15.0, 21.0, 18.0, 15.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4749722480773926, -2.408628225326538, -2.3422842025756836, -2.275940179824829, -2.2095961570739746, -2.14325213432312, -2.0769081115722656, -2.0105643272399902, -1.9442201852798462, -1.8778761625289917, -1.8115321397781372, -1.7451881170272827, -1.6788442134857178, -1.6125001907348633, -1.5461561679840088, -1.4798121452331543, -1.4134681224822998, -1.3471240997314453, -1.2807800769805908, -1.2144360542297363, -1.1480920314788818, -1.0817480087280273, -1.0154041051864624, -0.9490600824356079, -0.8827160596847534, -0.8163720369338989, -0.7500280141830444, -0.6836840510368347, -0.6173400282859802, -0.5509960055351257, -0.48465201258659363, -0.4183080196380615, -0.35196399688720703, -0.28561997413635254, -0.21927598118782043, -0.15293197333812714, -0.08658796548843384, -0.020243942737579346, 0.04610005021095276, 0.11244404315948486, 0.17878806591033936, 0.24513207376003265, 0.31147608160972595, 0.37782007455825806, 0.44416409730911255, 0.510508120059967, 0.5768520832061768, 0.6431961059570312, 0.7095401287078857, 0.7758841514587402, 0.8422281742095947, 0.9085721373558044, 0.9749161601066589, 1.0412602424621582, 1.1076041460037231, 1.1739481687545776, 1.2402921915054321, 1.3066362142562866, 1.3729802370071411, 1.4393242597579956, 1.5056681632995605, 1.572012186050415, 1.6383562088012695, 1.704700231552124, 1.7710442543029785]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 9.0, 15.0, 33.0, 39.0, 79.0, 140.0, 288.0, 571.0, 1343.0, 3751.0, 13661.0, 91097.0, 1614275.0, 2305185.0, 139064.0, 17357.0, 4404.0, 1515.0, 686.0, 314.0, 170.0, 104.0, 81.0, 26.0, 23.0, 20.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.164459228515625, -0.15838623046875, -0.152313232421875, -0.146240234375, -0.140167236328125, -0.13409423828125, -0.128021240234375, -0.1219482421875, -0.115875244140625, -0.10980224609375, -0.103729248046875, -0.09765625, -0.091583251953125, -0.08551025390625, -0.079437255859375, -0.0733642578125, -0.067291259765625, -0.06121826171875, -0.055145263671875, -0.049072265625, -0.042999267578125, -0.03692626953125, -0.030853271484375, -0.0247802734375, -0.018707275390625, -0.01263427734375, -0.006561279296875, -0.00048828125, 0.005584716796875, 0.01165771484375, 0.017730712890625, 0.0238037109375, 0.029876708984375, 0.03594970703125, 0.042022705078125, 0.048095703125, 0.054168701171875, 0.06024169921875, 0.066314697265625, 0.0723876953125, 0.078460693359375, 0.08453369140625, 0.090606689453125, 0.0966796875, 0.102752685546875, 0.10882568359375, 0.114898681640625, 0.1209716796875, 0.127044677734375, 0.13311767578125, 0.139190673828125, 0.145263671875, 0.151336669921875, 0.15740966796875, 0.163482666015625, 0.1695556640625, 0.175628662109375, 0.18170166015625, 0.187774658203125, 0.19384765625, 0.199920654296875, 0.20599365234375, 0.212066650390625, 0.2181396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 13.0, 14.0, 10.0, 13.0, 35.0, 44.0, 58.0, 65.0, 84.0, 111.0, 106.0, 78.0, 79.0, 76.0, 52.0, 44.0, 39.0, 23.0, 17.0, 11.0, 8.0, 10.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165771484375, -0.1597614288330078, -0.15375137329101562, -0.14774131774902344, -0.14173126220703125, -0.13572120666503906, -0.12971115112304688, -0.12370109558105469, -0.1176910400390625, -0.11168098449707031, -0.10567092895507812, -0.09966087341308594, -0.09365081787109375, -0.08764076232910156, -0.08163070678710938, -0.07562065124511719, -0.069610595703125, -0.06360054016113281, -0.057590484619140625, -0.05158042907714844, -0.04557037353515625, -0.03956031799316406, -0.033550262451171875, -0.027540206909179688, -0.0215301513671875, -0.015520095825195312, -0.009510040283203125, -0.0034999847412109375, 0.00251007080078125, 0.008520126342773438, 0.014530181884765625, 0.020540237426757812, 0.02655029296875, 0.03256034851074219, 0.038570404052734375, 0.04458045959472656, 0.05059051513671875, 0.05660057067871094, 0.06261062622070312, 0.06862068176269531, 0.0746307373046875, 0.08064079284667969, 0.08665084838867188, 0.09266090393066406, 0.09867095947265625, 0.10468101501464844, 0.11069107055664062, 0.11670112609863281, 0.122711181640625, 0.1287212371826172, 0.13473129272460938, 0.14074134826660156, 0.14675140380859375, 0.15276145935058594, 0.15877151489257812, 0.1647815704345703, 0.1707916259765625, 0.1768016815185547, 0.18281173706054688, 0.18882179260253906, 0.19483184814453125, 0.20084190368652344, 0.20685195922851562, 0.2128620147705078, 0.2188720703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 12.0, 9.0, 19.0, 30.0, 32.0, 68.0, 153.0, 334.0, 772.0, 2129.0, 8854.0, 89400.0, 3726889.0, 341366.0, 18270.0, 3967.0, 1127.0, 443.0, 194.0, 89.0, 57.0, 21.0, 14.0, 8.0, 8.0, 8.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3416595458984375, -0.329315185546875, -0.3169708251953125, -0.30462646484375, -0.2922821044921875, -0.279937744140625, -0.2675933837890625, -0.2552490234375, -0.2429046630859375, -0.230560302734375, -0.2182159423828125, -0.20587158203125, -0.1935272216796875, -0.181182861328125, -0.1688385009765625, -0.156494140625, -0.1441497802734375, -0.131805419921875, -0.1194610595703125, -0.10711669921875, -0.0947723388671875, -0.082427978515625, -0.0700836181640625, -0.0577392578125, -0.0453948974609375, -0.033050537109375, -0.0207061767578125, -0.00836181640625, 0.0039825439453125, 0.016326904296875, 0.0286712646484375, 0.041015625, 0.0533599853515625, 0.065704345703125, 0.0780487060546875, 0.09039306640625, 0.1027374267578125, 0.115081787109375, 0.1274261474609375, 0.1397705078125, 0.1521148681640625, 0.164459228515625, 0.1768035888671875, 0.18914794921875, 0.2014923095703125, 0.213836669921875, 0.2261810302734375, 0.238525390625, 0.2508697509765625, 0.263214111328125, 0.2755584716796875, 0.28790283203125, 0.3002471923828125, 0.312591552734375, 0.3249359130859375, 0.3372802734375, 0.3496246337890625, 0.361968994140625, 0.3743133544921875, 0.38665771484375, 0.3990020751953125, 0.411346435546875, 0.4236907958984375, 0.43603515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 10.0, 9.0, 10.0, 14.0, 16.0, 33.0, 41.0, 69.0, 119.0, 279.0, 484.0, 935.0, 894.0, 569.0, 246.0, 134.0, 73.0, 35.0, 28.0, 17.0, 11.0, 9.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30322265625, -0.29309844970703125, -0.2829742431640625, -0.27285003662109375, -0.262725830078125, -0.25260162353515625, -0.2424774169921875, -0.23235321044921875, -0.22222900390625, -0.21210479736328125, -0.2019805908203125, -0.19185638427734375, -0.181732177734375, -0.17160797119140625, -0.1614837646484375, -0.15135955810546875, -0.1412353515625, -0.13111114501953125, -0.1209869384765625, -0.11086273193359375, -0.100738525390625, -0.09061431884765625, -0.0804901123046875, -0.07036590576171875, -0.06024169921875, -0.05011749267578125, -0.0399932861328125, -0.02986907958984375, -0.019744873046875, -0.00962066650390625, 0.0005035400390625, 0.01062774658203125, 0.020751953125, 0.03087615966796875, 0.0410003662109375, 0.05112457275390625, 0.061248779296875, 0.07137298583984375, 0.0814971923828125, 0.09162139892578125, 0.10174560546875, 0.11186981201171875, 0.1219940185546875, 0.13211822509765625, 0.142242431640625, 0.15236663818359375, 0.1624908447265625, 0.17261505126953125, 0.1827392578125, 0.19286346435546875, 0.2029876708984375, 0.21311187744140625, 0.223236083984375, 0.23336029052734375, 0.2434844970703125, 0.25360870361328125, 0.26373291015625, 0.27385711669921875, 0.2839813232421875, 0.29410552978515625, 0.304229736328125, 0.31435394287109375, 0.3244781494140625, 0.33460235595703125, 0.3447265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 15.0, 68.0, 267.0, 390.0, 156.0, 53.0, 12.0, 11.0, 9.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.670238494873047, -5.513584136962891, -5.356929302215576, -5.200274467468262, -5.0436201095581055, -4.886965751647949, -4.730310916900635, -4.57365608215332, -4.417001724243164, -4.260347366333008, -4.103692531585693, -3.947037935256958, -3.7903833389282227, -3.6337287425994873, -3.477074146270752, -3.3204195499420166, -3.1637649536132812, -3.007110357284546, -2.8504557609558105, -2.693801164627075, -2.53714656829834, -2.3804919719696045, -2.223837375640869, -2.067182779312134, -1.9105281829833984, -1.753873586654663, -1.5972189903259277, -1.4405643939971924, -1.283909797668457, -1.1272552013397217, -0.9706006050109863, -0.813946008682251, -0.6572914123535156, -0.5006368160247803, -0.3439822196960449, -0.18732762336730957, -0.03067302703857422, 0.12598156929016113, 0.2826361656188965, 0.43929076194763184, 0.5959453582763672, 0.7525999546051025, 0.9092545509338379, 1.0659091472625732, 1.2225637435913086, 1.379218339920044, 1.5358729362487793, 1.6925275325775146, 1.84918212890625, 2.0058367252349854, 2.1624913215637207, 2.319145917892456, 2.4758005142211914, 2.6324551105499268, 2.789109706878662, 2.9457643032073975, 3.102418899536133, 3.259073495864868, 3.4157280921936035, 3.572382688522339, 3.729037284851074, 3.8856918811798096, 4.042346477508545, 4.199001312255859, 4.355655670166016]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 15.0, 11.0, 23.0, 26.0, 27.0, 67.0, 65.0, 69.0, 96.0, 81.0, 94.0, 97.0, 72.0, 62.0, 64.0, 44.0, 26.0, 18.0, 16.0, 13.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1853229999542236, -2.1063454151153564, -2.0273680686950684, -1.9483904838562012, -1.8694130182266235, -1.790435552597046, -1.7114579677581787, -1.632480502128601, -1.5535030364990234, -1.4745255708694458, -1.3955481052398682, -1.316570520401001, -1.2375930547714233, -1.1586155891418457, -1.0796380043029785, -1.0006605386734009, -0.9216830730438232, -0.8427056074142456, -0.7637280821800232, -0.6847505569458008, -0.6057730913162231, -0.5267956256866455, -0.4478181004524231, -0.3688405752182007, -0.28986310958862305, -0.21088561415672302, -0.131908118724823, -0.052930623292922974, 0.02604687213897705, 0.10502436757087708, 0.1840018630027771, 0.2629793882369995, 0.34195709228515625, 0.4209345877170563, 0.4999120831489563, 0.5788896083831787, 0.6578670740127563, 0.736844539642334, 0.8158220648765564, 0.8947995901107788, 0.9737770557403564, 1.052754521369934, 1.1317319869995117, 1.210709571838379, 1.2896870374679565, 1.3686645030975342, 1.4476420879364014, 1.526619553565979, 1.6055970191955566, 1.6845744848251343, 1.763551950454712, 1.842529535293579, 1.9215070009231567, 2.0004844665527344, 2.0794620513916016, 2.1584396362304688, 2.237416982650757, 2.316394567489624, 2.395371913909912, 2.4743494987487793, 2.5533270835876465, 2.6323044300079346, 2.7112820148468018, 2.79025936126709, 2.869236946105957]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 4.0, 13.0, 20.0, 25.0, 37.0, 77.0, 150.0, 200.0, 363.0, 712.0, 1498.0, 3439.0, 8996.0, 26759.0, 90799.0, 322095.0, 411186.0, 126633.0, 35767.0, 11699.0, 4352.0, 1832.0, 891.0, 438.0, 250.0, 123.0, 67.0, 42.0, 28.0, 14.0, 8.0, 12.0, 7.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2337646484375, -0.2271099090576172, -0.22045516967773438, -0.21380043029785156, -0.20714569091796875, -0.20049095153808594, -0.19383621215820312, -0.1871814727783203, -0.1805267333984375, -0.1738719940185547, -0.16721725463867188, -0.16056251525878906, -0.15390777587890625, -0.14725303649902344, -0.14059829711914062, -0.1339435577392578, -0.127288818359375, -0.12063407897949219, -0.11397933959960938, -0.10732460021972656, -0.10066986083984375, -0.09401512145996094, -0.08736038208007812, -0.08070564270019531, -0.0740509033203125, -0.06739616394042969, -0.060741424560546875, -0.05408668518066406, -0.04743194580078125, -0.04077720642089844, -0.034122467041015625, -0.027467727661132812, -0.02081298828125, -0.014158248901367188, -0.007503509521484375, -0.0008487701416015625, 0.00580596923828125, 0.012460708618164062, 0.019115447998046875, 0.025770187377929688, 0.0324249267578125, 0.03907966613769531, 0.045734405517578125, 0.05238914489746094, 0.05904388427734375, 0.06569862365722656, 0.07235336303710938, 0.07900810241699219, 0.085662841796875, 0.09231758117675781, 0.09897232055664062, 0.10562705993652344, 0.11228179931640625, 0.11893653869628906, 0.12559127807617188, 0.1322460174560547, 0.1389007568359375, 0.1455554962158203, 0.15221023559570312, 0.15886497497558594, 0.16551971435546875, 0.17217445373535156, 0.17882919311523438, 0.1854839324951172, 0.192138671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 19.0, 13.0, 29.0, 46.0, 57.0, 59.0, 80.0, 100.0, 75.0, 102.0, 75.0, 90.0, 54.0, 50.0, 48.0, 18.0, 20.0, 13.0, 7.0, 12.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.14399337768554688, -0.13796234130859375, -0.13193130493164062, -0.1259002685546875, -0.11986923217773438, -0.11383819580078125, -0.10780715942382812, -0.101776123046875, -0.09574508666992188, -0.08971405029296875, -0.08368301391601562, -0.0776519775390625, -0.07162094116210938, -0.06558990478515625, -0.059558868408203125, -0.05352783203125, -0.047496795654296875, -0.04146575927734375, -0.035434722900390625, -0.0294036865234375, -0.023372650146484375, -0.01734161376953125, -0.011310577392578125, -0.005279541015625, 0.000751495361328125, 0.00678253173828125, 0.012813568115234375, 0.0188446044921875, 0.024875640869140625, 0.03090667724609375, 0.036937713623046875, 0.04296875, 0.048999786376953125, 0.05503082275390625, 0.061061859130859375, 0.0670928955078125, 0.07312393188476562, 0.07915496826171875, 0.08518600463867188, 0.091217041015625, 0.09724807739257812, 0.10327911376953125, 0.10931015014648438, 0.1153411865234375, 0.12137222290039062, 0.12740325927734375, 0.13343429565429688, 0.13946533203125, 0.14549636840820312, 0.15152740478515625, 0.15755844116210938, 0.1635894775390625, 0.16962051391601562, 0.17565155029296875, 0.18168258666992188, 0.187713623046875, 0.19374465942382812, 0.19977569580078125, 0.20580673217773438, 0.2118377685546875, 0.21786880493164062, 0.22389984130859375, 0.22993087768554688, 0.2359619140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 21.0, 20.0, 27.0, 41.0, 60.0, 96.0, 146.0, 230.0, 434.0, 872.0, 1733.0, 4858.0, 25587.0, 603412.0, 382197.0, 20992.0, 4319.0, 1682.0, 764.0, 420.0, 227.0, 146.0, 89.0, 52.0, 42.0, 22.0, 14.0, 11.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.57861328125, -0.5620613098144531, -0.5455093383789062, -0.5289573669433594, -0.5124053955078125, -0.4958534240722656, -0.47930145263671875, -0.4627494812011719, -0.446197509765625, -0.4296455383300781, -0.41309356689453125, -0.3965415954589844, -0.3799896240234375, -0.3634376525878906, -0.34688568115234375, -0.3303337097167969, -0.31378173828125, -0.2972297668457031, -0.28067779541015625, -0.2641258239746094, -0.2475738525390625, -0.23102188110351562, -0.21446990966796875, -0.19791793823242188, -0.181365966796875, -0.16481399536132812, -0.14826202392578125, -0.13171005249023438, -0.1151580810546875, -0.09860610961914062, -0.08205413818359375, -0.06550216674804688, -0.0489501953125, -0.032398223876953125, -0.01584625244140625, 0.000705718994140625, 0.0172576904296875, 0.033809661865234375, 0.05036163330078125, 0.06691360473632812, 0.083465576171875, 0.10001754760742188, 0.11656951904296875, 0.13312149047851562, 0.1496734619140625, 0.16622543334960938, 0.18277740478515625, 0.19932937622070312, 0.21588134765625, 0.23243331909179688, 0.24898529052734375, 0.2655372619628906, 0.2820892333984375, 0.2986412048339844, 0.31519317626953125, 0.3317451477050781, 0.348297119140625, 0.3648490905761719, 0.38140106201171875, 0.3979530334472656, 0.4145050048828125, 0.4310569763183594, 0.44760894775390625, 0.4641609191894531, 0.480712890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 8.0, 9.0, 6.0, 15.0, 10.0, 24.0, 18.0, 23.0, 33.0, 34.0, 40.0, 31.0, 41.0, 65.0, 60.0, 41.0, 66.0, 58.0, 59.0, 46.0, 51.0, 38.0, 41.0, 29.0, 41.0, 11.0, 24.0, 13.0, 12.0, 8.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.62744140625, -0.6097564697265625, -0.592071533203125, -0.5743865966796875, -0.55670166015625, -0.5390167236328125, -0.521331787109375, -0.5036468505859375, -0.4859619140625, -0.4682769775390625, -0.450592041015625, -0.4329071044921875, -0.41522216796875, -0.3975372314453125, -0.379852294921875, -0.3621673583984375, -0.344482421875, -0.3267974853515625, -0.309112548828125, -0.2914276123046875, -0.27374267578125, -0.2560577392578125, -0.238372802734375, -0.2206878662109375, -0.2030029296875, -0.1853179931640625, -0.167633056640625, -0.1499481201171875, -0.13226318359375, -0.1145782470703125, -0.096893310546875, -0.0792083740234375, -0.0615234375, -0.0438385009765625, -0.026153564453125, -0.0084686279296875, 0.00921630859375, 0.0269012451171875, 0.044586181640625, 0.0622711181640625, 0.0799560546875, 0.0976409912109375, 0.115325927734375, 0.1330108642578125, 0.15069580078125, 0.1683807373046875, 0.186065673828125, 0.2037506103515625, 0.221435546875, 0.2391204833984375, 0.256805419921875, 0.2744903564453125, 0.29217529296875, 0.3098602294921875, 0.327545166015625, 0.3452301025390625, 0.3629150390625, 0.3805999755859375, 0.398284912109375, 0.4159698486328125, 0.43365478515625, 0.4513397216796875, 0.469024658203125, 0.4867095947265625, 0.50439453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 10.0, 23.0, 53.0, 115.0, 411.0, 2031.0, 35247.0, 982066.0, 26264.0, 1755.0, 362.0, 125.0, 37.0, 23.0, 4.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.544158935546875, -0.52923583984375, -0.514312744140625, -0.4993896484375, -0.484466552734375, -0.46954345703125, -0.454620361328125, -0.439697265625, -0.424774169921875, -0.40985107421875, -0.394927978515625, -0.3800048828125, -0.365081787109375, -0.35015869140625, -0.335235595703125, -0.3203125, -0.305389404296875, -0.29046630859375, -0.275543212890625, -0.2606201171875, -0.245697021484375, -0.23077392578125, -0.215850830078125, -0.200927734375, -0.186004638671875, -0.17108154296875, -0.156158447265625, -0.1412353515625, -0.126312255859375, -0.11138916015625, -0.096466064453125, -0.08154296875, -0.066619873046875, -0.05169677734375, -0.036773681640625, -0.0218505859375, -0.006927490234375, 0.00799560546875, 0.022918701171875, 0.037841796875, 0.052764892578125, 0.06768798828125, 0.082611083984375, 0.0975341796875, 0.112457275390625, 0.12738037109375, 0.142303466796875, 0.1572265625, 0.172149658203125, 0.18707275390625, 0.201995849609375, 0.2169189453125, 0.231842041015625, 0.24676513671875, 0.261688232421875, 0.276611328125, 0.291534423828125, 0.30645751953125, 0.321380615234375, 0.3363037109375, 0.351226806640625, 0.36614990234375, 0.381072998046875, 0.39599609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 9.0, 9.0, 7.0, 9.0, 17.0, 15.0, 25.0, 24.0, 18.0, 30.0, 49.0, 37.0, 71.0, 69.0, 110.0, 99.0, 83.0, 61.0, 48.0, 33.0, 19.0, 25.0, 22.0, 19.0, 12.0, 9.0, 10.0, 4.0, 8.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35981559753418e-05, -6.16004690527916e-05, -5.9602782130241394e-05, -5.760509520769119e-05, -5.560740828514099e-05, -5.360972136259079e-05, -5.161203444004059e-05, -4.961434751749039e-05, -4.7616660594940186e-05, -4.5618973672389984e-05, -4.362128674983978e-05, -4.162359982728958e-05, -3.962591290473938e-05, -3.762822598218918e-05, -3.563053905963898e-05, -3.3632852137088776e-05, -3.1635165214538574e-05, -2.9637478291988373e-05, -2.763979136943817e-05, -2.564210444688797e-05, -2.364441752433777e-05, -2.1646730601787567e-05, -1.9649043679237366e-05, -1.7651356756687164e-05, -1.5653669834136963e-05, -1.3655982911586761e-05, -1.165829598903656e-05, -9.660609066486359e-06, -7.662922143936157e-06, -5.665235221385956e-06, -3.6675482988357544e-06, -1.669861376285553e-06, 3.2782554626464844e-07, 2.32551246881485e-06, 4.323199391365051e-06, 6.320886313915253e-06, 8.318573236465454e-06, 1.0316260159015656e-05, 1.2313947081565857e-05, 1.4311634004116058e-05, 1.630932092666626e-05, 1.830700784921646e-05, 2.0304694771766663e-05, 2.2302381694316864e-05, 2.4300068616867065e-05, 2.6297755539417267e-05, 2.8295442461967468e-05, 3.029312938451767e-05, 3.229081630706787e-05, 3.428850322961807e-05, 3.6286190152168274e-05, 3.8283877074718475e-05, 4.028156399726868e-05, 4.227925091981888e-05, 4.427693784236908e-05, 4.627462476491928e-05, 4.827231168746948e-05, 5.0269998610019684e-05, 5.2267685532569885e-05, 5.426537245512009e-05, 5.626305937767029e-05, 5.826074630022049e-05, 6.025843322277069e-05, 6.225612014532089e-05, 6.42538070678711e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 7.0, 5.0, 12.0, 26.0, 20.0, 27.0, 30.0, 50.0, 77.0, 76.0, 121.0, 165.0, 213.0, 350.0, 529.0, 848.0, 1483.0, 2891.0, 6320.0, 16259.0, 57081.0, 338537.0, 525284.0, 65938.0, 18141.0, 6780.0, 3144.0, 1516.0, 895.0, 496.0, 318.0, 263.0, 196.0, 123.0, 98.0, 66.0, 34.0, 19.0, 25.0, 16.0, 13.0, 14.0, 8.0, 10.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1385498046875, -0.13435745239257812, -0.13016510009765625, -0.12597274780273438, -0.1217803955078125, -0.11758804321289062, -0.11339569091796875, -0.10920333862304688, -0.105010986328125, -0.10081863403320312, -0.09662628173828125, -0.09243392944335938, -0.0882415771484375, -0.08404922485351562, -0.07985687255859375, -0.07566452026367188, -0.07147216796875, -0.06727981567382812, -0.06308746337890625, -0.058895111083984375, -0.0547027587890625, -0.050510406494140625, -0.04631805419921875, -0.042125701904296875, -0.037933349609375, -0.033740997314453125, -0.02954864501953125, -0.025356292724609375, -0.0211639404296875, -0.016971588134765625, -0.01277923583984375, -0.008586883544921875, -0.00439453125, -0.000202178955078125, 0.00399017333984375, 0.008182525634765625, 0.0123748779296875, 0.016567230224609375, 0.02075958251953125, 0.024951934814453125, 0.029144287109375, 0.033336639404296875, 0.03752899169921875, 0.041721343994140625, 0.0459136962890625, 0.050106048583984375, 0.05429840087890625, 0.058490753173828125, 0.06268310546875, 0.06687545776367188, 0.07106781005859375, 0.07526016235351562, 0.0794525146484375, 0.08364486694335938, 0.08783721923828125, 0.09202957153320312, 0.096221923828125, 0.10041427612304688, 0.10460662841796875, 0.10879898071289062, 0.1129913330078125, 0.11718368530273438, 0.12137603759765625, 0.12556838989257812, 0.1297607421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 9.0, 18.0, 18.0, 21.0, 23.0, 28.0, 43.0, 70.0, 66.0, 88.0, 74.0, 93.0, 105.0, 89.0, 48.0, 35.0, 36.0, 24.0, 21.0, 21.0, 9.0, 10.0, 9.0, 5.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.16423606872558594, -0.15940475463867188, -0.1545734405517578, -0.14974212646484375, -0.1449108123779297, -0.14007949829101562, -0.13524818420410156, -0.1304168701171875, -0.12558555603027344, -0.12075424194335938, -0.11592292785644531, -0.11109161376953125, -0.10626029968261719, -0.10142898559570312, -0.09659767150878906, -0.091766357421875, -0.08693504333496094, -0.08210372924804688, -0.07727241516113281, -0.07244110107421875, -0.06760978698730469, -0.06277847290039062, -0.05794715881347656, -0.0531158447265625, -0.04828453063964844, -0.043453216552734375, -0.03862190246582031, -0.03379058837890625, -0.028959274291992188, -0.024127960205078125, -0.019296646118164062, -0.01446533203125, -0.009634017944335938, -0.004802703857421875, 2.86102294921875e-05, 0.00485992431640625, 0.009691238403320312, 0.014522552490234375, 0.019353866577148438, 0.0241851806640625, 0.029016494750976562, 0.033847808837890625, 0.03867912292480469, 0.04351043701171875, 0.04834175109863281, 0.053173065185546875, 0.05800437927246094, 0.062835693359375, 0.06766700744628906, 0.07249832153320312, 0.07732963562011719, 0.08216094970703125, 0.08699226379394531, 0.09182357788085938, 0.09665489196777344, 0.1014862060546875, 0.10631752014160156, 0.11114883422851562, 0.11598014831542969, 0.12081146240234375, 0.1256427764892578, 0.13047409057617188, 0.13530540466308594, 0.14013671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 9.0, 6.0, 16.0, 74.0, 228.0, 483.0, 134.0, 36.0, 13.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.729398727416992, -4.525608062744141, -4.321817398071289, -4.1180267333984375, -3.914236068725586, -3.7104454040527344, -3.506654739379883, -3.3028640747070312, -3.0990734100341797, -2.895282745361328, -2.6914920806884766, -2.487701416015625, -2.2839107513427734, -2.080120086669922, -1.8763294219970703, -1.6725387573242188, -1.4687480926513672, -1.2649574279785156, -1.061166763305664, -0.8573760986328125, -0.6535854339599609, -0.4497947692871094, -0.2460041046142578, -0.04221343994140625, 0.1615772247314453, 0.3653678894042969, 0.5691585540771484, 0.77294921875, 0.9767398834228516, 1.1805305480957031, 1.3843212127685547, 1.5881118774414062, 1.7919025421142578, 1.9956932067871094, 2.199483871459961, 2.4032745361328125, 2.607065200805664, 2.8108558654785156, 3.014646530151367, 3.2184371948242188, 3.4222278594970703, 3.626018524169922, 3.8298091888427734, 4.033599853515625, 4.237390518188477, 4.441181182861328, 4.64497184753418, 4.848762512207031, 5.052553176879883, 5.256343841552734, 5.460134506225586, 5.6639251708984375, 5.867715835571289, 6.071506500244141, 6.275297164916992, 6.479087829589844, 6.682878494262695, 6.886669158935547, 7.090459823608398, 7.29425048828125, 7.498041152954102, 7.701831817626953, 7.905622482299805, 8.109413146972656, 8.313203811645508]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 2.0, 7.0, 7.0, 10.0, 9.0, 11.0, 9.0, 23.0, 22.0, 27.0, 41.0, 28.0, 24.0, 40.0, 37.0, 25.0, 37.0, 56.0, 57.0, 54.0, 50.0, 57.0, 63.0, 38.0, 31.0, 33.0, 21.0, 21.0, 21.0, 20.0, 19.0, 16.0, 16.0, 10.0, 13.0, 7.0, 8.0, 5.0, 3.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6205451488494873, -1.5670948028564453, -1.5136444568634033, -1.4601942300796509, -1.4067438840866089, -1.353293538093567, -1.2998433113098145, -1.2463929653167725, -1.1929426193237305, -1.1394922733306885, -1.0860419273376465, -1.032591700553894, -0.979141354560852, -0.9256910085678101, -0.8722407221794128, -0.8187904357910156, -0.7653400897979736, -0.7118897438049316, -0.6584394574165344, -0.6049891710281372, -0.5515388250350952, -0.4980885088443756, -0.444638192653656, -0.3911878764629364, -0.3377375602722168, -0.2842872440814972, -0.2308369278907776, -0.17738661170005798, -0.12393629550933838, -0.07048597931861877, -0.01703566312789917, 0.036414653062820435, 0.08986496925354004, 0.14331528544425964, 0.19676560163497925, 0.25021591782569885, 0.30366623401641846, 0.35711655020713806, 0.41056686639785767, 0.46401718258857727, 0.5174674987792969, 0.5709178447723389, 0.6243681311607361, 0.6778184175491333, 0.7312687635421753, 0.7847191095352173, 0.8381693959236145, 0.8916196823120117, 0.9450700283050537, 0.9985203742980957, 1.0519707202911377, 1.1054209470748901, 1.1588712930679321, 1.2123216390609741, 1.2657718658447266, 1.3192222118377686, 1.3726725578308105, 1.4261229038238525, 1.4795732498168945, 1.533023476600647, 1.586473822593689, 1.639924168586731, 1.6933743953704834, 1.7468247413635254, 1.8002750873565674]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 16.0, 19.0, 21.0, 38.0, 83.0, 98.0, 169.0, 315.0, 680.0, 1328.0, 3329.0, 10317.0, 49729.0, 605302.0, 3132854.0, 344786.0, 32764.0, 7463.0, 2626.0, 1121.0, 567.0, 254.0, 139.0, 87.0, 60.0, 36.0, 21.0, 12.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.14270591735839844, -0.13660812377929688, -0.1305103302001953, -0.12441253662109375, -0.11831474304199219, -0.11221694946289062, -0.10611915588378906, -0.1000213623046875, -0.09392356872558594, -0.08782577514648438, -0.08172798156738281, -0.07563018798828125, -0.06953239440917969, -0.06343460083007812, -0.05733680725097656, -0.051239013671875, -0.04514122009277344, -0.039043426513671875, -0.03294563293457031, -0.02684783935546875, -0.020750045776367188, -0.014652252197265625, -0.008554458618164062, -0.0024566650390625, 0.0036411285400390625, 0.009738922119140625, 0.015836715698242188, 0.02193450927734375, 0.028032302856445312, 0.034130096435546875, 0.04022789001464844, 0.04632568359375, 0.05242347717285156, 0.058521270751953125, 0.06461906433105469, 0.07071685791015625, 0.07681465148925781, 0.08291244506835938, 0.08901023864746094, 0.0951080322265625, 0.10120582580566406, 0.10730361938476562, 0.11340141296386719, 0.11949920654296875, 0.1255970001220703, 0.13169479370117188, 0.13779258728027344, 0.143890380859375, 0.14998817443847656, 0.15608596801757812, 0.1621837615966797, 0.16828155517578125, 0.1743793487548828, 0.18047714233398438, 0.18657493591308594, 0.1926727294921875, 0.19877052307128906, 0.20486831665039062, 0.2109661102294922, 0.21706390380859375, 0.2231616973876953, 0.22925949096679688, 0.23535728454589844, 0.241455078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 4.0, 12.0, 15.0, 25.0, 41.0, 52.0, 49.0, 69.0, 76.0, 72.0, 78.0, 69.0, 89.0, 77.0, 75.0, 47.0, 33.0, 21.0, 31.0, 16.0, 12.0, 5.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.14977645874023438, -0.14403533935546875, -0.13829421997070312, -0.1325531005859375, -0.12681198120117188, -0.12107086181640625, -0.11532974243164062, -0.109588623046875, -0.10384750366210938, -0.09810638427734375, -0.09236526489257812, -0.0866241455078125, -0.08088302612304688, -0.07514190673828125, -0.06940078735351562, -0.06365966796875, -0.057918548583984375, -0.05217742919921875, -0.046436309814453125, -0.0406951904296875, -0.034954071044921875, -0.02921295166015625, -0.023471832275390625, -0.017730712890625, -0.011989593505859375, -0.00624847412109375, -0.000507354736328125, 0.0052337646484375, 0.010974884033203125, 0.01671600341796875, 0.022457122802734375, 0.0281982421875, 0.033939361572265625, 0.03968048095703125, 0.045421600341796875, 0.0511627197265625, 0.056903839111328125, 0.06264495849609375, 0.06838607788085938, 0.074127197265625, 0.07986831665039062, 0.08560943603515625, 0.09135055541992188, 0.0970916748046875, 0.10283279418945312, 0.10857391357421875, 0.11431503295898438, 0.12005615234375, 0.12579727172851562, 0.13153839111328125, 0.13727951049804688, 0.1430206298828125, 0.14876174926757812, 0.15450286865234375, 0.16024398803710938, 0.165985107421875, 0.17172622680664062, 0.17746734619140625, 0.18320846557617188, 0.1889495849609375, 0.19469070434570312, 0.20043182373046875, 0.20617294311523438, 0.2119140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 5.0, 5.0, 12.0, 5.0, 15.0, 25.0, 49.0, 71.0, 97.0, 160.0, 321.0, 589.0, 1034.0, 2155.0, 5270.0, 15900.0, 75454.0, 1097958.0, 2790783.0, 164776.0, 26761.0, 7352.0, 2671.0, 1198.0, 675.0, 359.0, 195.0, 130.0, 83.0, 54.0, 42.0, 33.0, 15.0, 11.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.1797504425048828, -0.17261123657226562, -0.16547203063964844, -0.15833282470703125, -0.15119361877441406, -0.14405441284179688, -0.1369152069091797, -0.1297760009765625, -0.12263679504394531, -0.11549758911132812, -0.10835838317871094, -0.10121917724609375, -0.09407997131347656, -0.08694076538085938, -0.07980155944824219, -0.072662353515625, -0.06552314758300781, -0.058383941650390625, -0.05124473571777344, -0.04410552978515625, -0.03696632385253906, -0.029827117919921875, -0.022687911987304688, -0.0155487060546875, -0.008409500122070312, -0.001270294189453125, 0.0058689117431640625, 0.01300811767578125, 0.020147323608398438, 0.027286529541015625, 0.03442573547363281, 0.04156494140625, 0.04870414733886719, 0.055843353271484375, 0.06298255920410156, 0.07012176513671875, 0.07726097106933594, 0.08440017700195312, 0.09153938293457031, 0.0986785888671875, 0.10581779479980469, 0.11295700073242188, 0.12009620666503906, 0.12723541259765625, 0.13437461853027344, 0.14151382446289062, 0.1486530303955078, 0.155792236328125, 0.1629314422607422, 0.17007064819335938, 0.17720985412597656, 0.18434906005859375, 0.19148826599121094, 0.19862747192382812, 0.2057666778564453, 0.2129058837890625, 0.2200450897216797, 0.22718429565429688, 0.23432350158691406, 0.24146270751953125, 0.24860191345214844, 0.2557411193847656, 0.2628803253173828, 0.27001953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 19.0, 22.0, 39.0, 73.0, 125.0, 253.0, 461.0, 843.0, 900.0, 574.0, 334.0, 146.0, 84.0, 48.0, 39.0, 19.0, 20.0, 13.0, 12.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.3205986022949219, -0.31063079833984375, -0.3006629943847656, -0.2906951904296875, -0.2807273864746094, -0.27075958251953125, -0.2607917785644531, -0.250823974609375, -0.24085617065429688, -0.23088836669921875, -0.22092056274414062, -0.2109527587890625, -0.20098495483398438, -0.19101715087890625, -0.18104934692382812, -0.17108154296875, -0.16111373901367188, -0.15114593505859375, -0.14117813110351562, -0.1312103271484375, -0.12124252319335938, -0.11127471923828125, -0.10130691528320312, -0.091339111328125, -0.08137130737304688, -0.07140350341796875, -0.061435699462890625, -0.0514678955078125, -0.041500091552734375, -0.03153228759765625, -0.021564483642578125, -0.0115966796875, -0.001628875732421875, 0.00833892822265625, 0.018306732177734375, 0.0282745361328125, 0.038242340087890625, 0.04821014404296875, 0.058177947998046875, 0.068145751953125, 0.07811355590820312, 0.08808135986328125, 0.09804916381835938, 0.1080169677734375, 0.11798477172851562, 0.12795257568359375, 0.13792037963867188, 0.14788818359375, 0.15785598754882812, 0.16782379150390625, 0.17779159545898438, 0.1877593994140625, 0.19772720336914062, 0.20769500732421875, 0.21766281127929688, 0.227630615234375, 0.23759841918945312, 0.24756622314453125, 0.2575340270996094, 0.2675018310546875, 0.2774696350097656, 0.28743743896484375, 0.2974052429199219, 0.307373046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 13.0, 51.0, 124.0, 255.0, 275.0, 159.0, 52.0, 34.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.749657392501831, -3.6328115463256836, -3.5159659385681152, -3.3991200923919678, -3.2822744846343994, -3.165428638458252, -3.0485830307006836, -2.931737184524536, -2.8148913383483887, -2.698045492172241, -2.581199884414673, -2.4643540382385254, -2.347508430480957, -2.2306625843048096, -2.113816738128662, -1.9969711303710938, -1.8801255226135254, -1.7632797956466675, -1.6464340686798096, -1.529588222503662, -1.4127426147460938, -1.2958967685699463, -1.1790510416030884, -1.0622053146362305, -0.9453595876693726, -0.8285138607025146, -0.7116681337356567, -0.594822347164154, -0.47797662019729614, -0.36113089323043823, -0.24428510665893555, -0.12743937969207764, -0.010593414306640625, 0.10625232756137848, 0.22309806942939758, 0.3399438261985779, 0.4567895531654358, 0.5736352801322937, 0.6904810667037964, 0.8073267936706543, 0.9241725206375122, 1.0410182476043701, 1.157863974571228, 1.274709701538086, 1.3915555477142334, 1.5084011554718018, 1.6252470016479492, 1.7420927286148071, 1.858938455581665, 1.975784182548523, 2.092629909515381, 2.2094757556915283, 2.3263213634490967, 2.443167209625244, 2.5600128173828125, 2.67685866355896, 2.7937045097351074, 2.910550355911255, 3.0273959636688232, 3.1442418098449707, 3.261087417602539, 3.3779332637786865, 3.494779109954834, 3.6116247177124023, 3.7284703254699707]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 8.0, 13.0, 15.0, 23.0, 25.0, 24.0, 23.0, 28.0, 43.0, 46.0, 46.0, 54.0, 53.0, 68.0, 58.0, 58.0, 70.0, 56.0, 50.0, 48.0, 43.0, 23.0, 30.0, 20.0, 13.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3352372646331787, -1.292466402053833, -1.2496955394744873, -1.2069246768951416, -1.1641539335250854, -1.1213830709457397, -1.078612208366394, -1.0358413457870483, -0.9930705428123474, -0.9502996802330017, -0.9075288772583008, -0.8647580146789551, -0.8219871520996094, -0.7792163491249084, -0.7364454865455627, -0.6936746835708618, -0.6509038209915161, -0.6081329584121704, -0.5653621554374695, -0.5225912928581238, -0.47982046008110046, -0.43704962730407715, -0.39427876472473145, -0.35150793194770813, -0.3087370991706848, -0.2659662663936615, -0.223195418715477, -0.18042457103729248, -0.13765373826026917, -0.09488290548324585, -0.052112042903900146, -0.009341210126876831, 0.033429503440856934, 0.07620034366846085, 0.11897118389606476, 0.16174203157424927, 0.20451286435127258, 0.2472836971282959, 0.2900545597076416, 0.3328253924846649, 0.37559622526168823, 0.41836705803871155, 0.46113789081573486, 0.5039087533950806, 0.5466796159744263, 0.5894504189491272, 0.6322212815284729, 0.6749920845031738, 0.7177629470825195, 0.7605338096618652, 0.8033046126365662, 0.8460754752159119, 0.8888462781906128, 0.9316171407699585, 0.9743880033493042, 1.01715886592865, 1.059929609298706, 1.1027004718780518, 1.1454713344573975, 1.1882421970367432, 1.2310129404067993, 1.273783802986145, 1.3165546655654907, 1.3593255281448364, 1.4020963907241821]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 9.0, 8.0, 16.0, 22.0, 15.0, 34.0, 47.0, 105.0, 174.0, 289.0, 562.0, 1118.0, 2405.0, 5979.0, 18251.0, 72091.0, 334520.0, 465959.0, 107239.0, 25963.0, 7782.0, 3024.0, 1387.0, 658.0, 390.0, 215.0, 106.0, 54.0, 35.0, 22.0, 16.0, 16.0, 20.0, 4.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26375770568847656, -0.2560310363769531, -0.2483043670654297, -0.24057769775390625, -0.2328510284423828, -0.22512435913085938, -0.21739768981933594, -0.2096710205078125, -0.20194435119628906, -0.19421768188476562, -0.1864910125732422, -0.17876434326171875, -0.1710376739501953, -0.16331100463867188, -0.15558433532714844, -0.147857666015625, -0.14013099670410156, -0.13240432739257812, -0.12467765808105469, -0.11695098876953125, -0.10922431945800781, -0.10149765014648438, -0.09377098083496094, -0.0860443115234375, -0.07831764221191406, -0.07059097290039062, -0.06286430358886719, -0.05513763427734375, -0.04741096496582031, -0.039684295654296875, -0.03195762634277344, -0.02423095703125, -0.016504287719726562, -0.008777618408203125, -0.0010509490966796875, 0.00667572021484375, 0.014402389526367188, 0.022129058837890625, 0.029855728149414062, 0.0375823974609375, 0.04530906677246094, 0.053035736083984375, 0.06076240539550781, 0.06848907470703125, 0.07621574401855469, 0.08394241333007812, 0.09166908264160156, 0.099395751953125, 0.10712242126464844, 0.11484909057617188, 0.12257575988769531, 0.13030242919921875, 0.1380290985107422, 0.14575576782226562, 0.15348243713378906, 0.1612091064453125, 0.16893577575683594, 0.17666244506835938, 0.1843891143798828, 0.19211578369140625, 0.1998424530029297, 0.20756912231445312, 0.21529579162597656, 0.2230224609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 13.0, 25.0, 21.0, 31.0, 49.0, 59.0, 67.0, 75.0, 68.0, 72.0, 74.0, 74.0, 77.0, 61.0, 48.0, 40.0, 38.0, 22.0, 22.0, 13.0, 6.0, 7.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14284706115722656, -0.13737869262695312, -0.1319103240966797, -0.12644195556640625, -0.12097358703613281, -0.11550521850585938, -0.11003684997558594, -0.1045684814453125, -0.09910011291503906, -0.09363174438476562, -0.08816337585449219, -0.08269500732421875, -0.07722663879394531, -0.07175827026367188, -0.06628990173339844, -0.060821533203125, -0.05535316467285156, -0.049884796142578125, -0.04441642761230469, -0.03894805908203125, -0.03347969055175781, -0.028011322021484375, -0.022542953491210938, -0.0170745849609375, -0.011606216430664062, -0.006137847900390625, -0.0006694793701171875, 0.00479888916015625, 0.010267257690429688, 0.015735626220703125, 0.021203994750976562, 0.02667236328125, 0.03214073181152344, 0.037609100341796875, 0.04307746887207031, 0.04854583740234375, 0.05401420593261719, 0.059482574462890625, 0.06495094299316406, 0.0704193115234375, 0.07588768005371094, 0.08135604858398438, 0.08682441711425781, 0.09229278564453125, 0.09776115417480469, 0.10322952270507812, 0.10869789123535156, 0.114166259765625, 0.11963462829589844, 0.12510299682617188, 0.1305713653564453, 0.13603973388671875, 0.1415081024169922, 0.14697647094726562, 0.15244483947753906, 0.1579132080078125, 0.16338157653808594, 0.16884994506835938, 0.1743183135986328, 0.17978668212890625, 0.1852550506591797, 0.19072341918945312, 0.19619178771972656, 0.20166015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 6.0, 15.0, 10.0, 22.0, 24.0, 31.0, 61.0, 72.0, 105.0, 165.0, 270.0, 506.0, 891.0, 1866.0, 5557.0, 26486.0, 286020.0, 668721.0, 45120.0, 7676.0, 2335.0, 1062.0, 558.0, 306.0, 201.0, 137.0, 89.0, 76.0, 46.0, 32.0, 17.0, 13.0, 10.0, 7.0, 9.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4095039367675781, -0.39591217041015625, -0.3823204040527344, -0.3687286376953125, -0.3551368713378906, -0.34154510498046875, -0.3279533386230469, -0.314361572265625, -0.3007698059082031, -0.28717803955078125, -0.2735862731933594, -0.2599945068359375, -0.24640274047851562, -0.23281097412109375, -0.21921920776367188, -0.20562744140625, -0.19203567504882812, -0.17844390869140625, -0.16485214233398438, -0.1512603759765625, -0.13766860961914062, -0.12407684326171875, -0.11048507690429688, -0.096893310546875, -0.08330154418945312, -0.06970977783203125, -0.056118011474609375, -0.0425262451171875, -0.028934478759765625, -0.01534271240234375, -0.001750946044921875, 0.0118408203125, 0.025432586669921875, 0.03902435302734375, 0.052616119384765625, 0.0662078857421875, 0.07979965209960938, 0.09339141845703125, 0.10698318481445312, 0.120574951171875, 0.13416671752929688, 0.14775848388671875, 0.16135025024414062, 0.1749420166015625, 0.18853378295898438, 0.20212554931640625, 0.21571731567382812, 0.22930908203125, 0.24290084838867188, 0.25649261474609375, 0.2700843811035156, 0.2836761474609375, 0.2972679138183594, 0.31085968017578125, 0.3244514465332031, 0.338043212890625, 0.3516349792480469, 0.36522674560546875, 0.3788185119628906, 0.3924102783203125, 0.4060020446777344, 0.41959381103515625, 0.4331855773925781, 0.44677734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 16.0, 19.0, 21.0, 25.0, 21.0, 48.0, 57.0, 55.0, 45.0, 80.0, 59.0, 71.0, 80.0, 45.0, 51.0, 61.0, 48.0, 36.0, 26.0, 27.0, 25.0, 21.0, 17.0, 11.0, 9.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4671974182128906, -0.44831085205078125, -0.4294242858886719, -0.4105377197265625, -0.3916511535644531, -0.37276458740234375, -0.3538780212402344, -0.334991455078125, -0.3161048889160156, -0.29721832275390625, -0.2783317565917969, -0.2594451904296875, -0.24055862426757812, -0.22167205810546875, -0.20278549194335938, -0.18389892578125, -0.16501235961914062, -0.14612579345703125, -0.12723922729492188, -0.1083526611328125, -0.08946609497070312, -0.07057952880859375, -0.051692962646484375, -0.032806396484375, -0.013919830322265625, 0.00496673583984375, 0.023853302001953125, 0.0427398681640625, 0.061626434326171875, 0.08051300048828125, 0.09939956665039062, 0.1182861328125, 0.13717269897460938, 0.15605926513671875, 0.17494583129882812, 0.1938323974609375, 0.21271896362304688, 0.23160552978515625, 0.2504920959472656, 0.269378662109375, 0.2882652282714844, 0.30715179443359375, 0.3260383605957031, 0.3449249267578125, 0.3638114929199219, 0.38269805908203125, 0.4015846252441406, 0.42047119140625, 0.4393577575683594, 0.45824432373046875, 0.4771308898925781, 0.4960174560546875, 0.5149040222167969, 0.5337905883789062, 0.5526771545410156, 0.571563720703125, 0.5904502868652344, 0.6093368530273438, 0.6282234191894531, 0.6471099853515625, 0.6659965515136719, 0.6848831176757812, 0.7037696838378906, 0.72265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 6.0, 23.0, 44.0, 97.0, 174.0, 544.0, 2628.0, 50433.0, 958496.0, 33275.0, 2008.0, 483.0, 172.0, 60.0, 41.0, 20.0, 15.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6201171875, -0.6055068969726562, -0.5908966064453125, -0.5762863159179688, -0.561676025390625, -0.5470657348632812, -0.5324554443359375, -0.5178451538085938, -0.50323486328125, -0.48862457275390625, -0.4740142822265625, -0.45940399169921875, -0.444793701171875, -0.43018341064453125, -0.4155731201171875, -0.40096282958984375, -0.3863525390625, -0.37174224853515625, -0.3571319580078125, -0.34252166748046875, -0.327911376953125, -0.31330108642578125, -0.2986907958984375, -0.28408050537109375, -0.26947021484375, -0.25485992431640625, -0.2402496337890625, -0.22563934326171875, -0.211029052734375, -0.19641876220703125, -0.1818084716796875, -0.16719818115234375, -0.152587890625, -0.13797760009765625, -0.1233673095703125, -0.10875701904296875, -0.094146728515625, -0.07953643798828125, -0.0649261474609375, -0.05031585693359375, -0.03570556640625, -0.02109527587890625, -0.0064849853515625, 0.00812530517578125, 0.022735595703125, 0.03734588623046875, 0.0519561767578125, 0.06656646728515625, 0.0811767578125, 0.09578704833984375, 0.1103973388671875, 0.12500762939453125, 0.139617919921875, 0.15422821044921875, 0.1688385009765625, 0.18344879150390625, 0.19805908203125, 0.21266937255859375, 0.2272796630859375, 0.24188995361328125, 0.256500244140625, 0.27111053466796875, 0.2857208251953125, 0.30033111572265625, 0.31494140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 8.0, 12.0, 19.0, 19.0, 24.0, 34.0, 53.0, 81.0, 101.0, 100.0, 97.0, 94.0, 76.0, 50.0, 34.0, 36.0, 24.0, 14.0, 22.0, 16.0, 6.0, 8.0, 3.0, 8.0, 3.0, 5.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-05, -6.000697612762451e-05, -5.8025121688842773e-05, -5.6043267250061035e-05, -5.40614128112793e-05, -5.207955837249756e-05, -5.009770393371582e-05, -4.811584949493408e-05, -4.6133995056152344e-05, -4.4152140617370605e-05, -4.217028617858887e-05, -4.018843173980713e-05, -3.820657730102539e-05, -3.622472286224365e-05, -3.4242868423461914e-05, -3.2261013984680176e-05, -3.0279159545898438e-05, -2.82973051071167e-05, -2.631545066833496e-05, -2.4333596229553223e-05, -2.2351741790771484e-05, -2.0369887351989746e-05, -1.8388032913208008e-05, -1.640617847442627e-05, -1.4424324035644531e-05, -1.2442469596862793e-05, -1.0460615158081055e-05, -8.478760719299316e-06, -6.496906280517578e-06, -4.51505184173584e-06, -2.5331974029541016e-06, -5.513429641723633e-07, 1.430511474609375e-06, 3.4123659133911133e-06, 5.3942203521728516e-06, 7.37607479095459e-06, 9.357929229736328e-06, 1.1339783668518066e-05, 1.3321638107299805e-05, 1.5303492546081543e-05, 1.728534698486328e-05, 1.926720142364502e-05, 2.1249055862426758e-05, 2.3230910301208496e-05, 2.5212764739990234e-05, 2.7194619178771973e-05, 2.917647361755371e-05, 3.115832805633545e-05, 3.314018249511719e-05, 3.5122036933898926e-05, 3.7103891372680664e-05, 3.90857458114624e-05, 4.106760025024414e-05, 4.304945468902588e-05, 4.503130912780762e-05, 4.7013163566589355e-05, 4.8995018005371094e-05, 5.097687244415283e-05, 5.295872688293457e-05, 5.494058132171631e-05, 5.692243576049805e-05, 5.8904290199279785e-05, 6.0886144638061523e-05, 6.286799907684326e-05, 6.4849853515625e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 4.0, 12.0, 15.0, 15.0, 23.0, 28.0, 52.0, 72.0, 94.0, 156.0, 220.0, 343.0, 580.0, 1074.0, 2370.0, 6193.0, 19751.0, 81089.0, 677399.0, 203977.0, 37442.0, 10432.0, 3570.0, 1599.0, 712.0, 438.0, 283.0, 194.0, 129.0, 85.0, 61.0, 46.0, 19.0, 19.0, 21.0, 16.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1519775390625, -0.14703369140625, -0.14208984375, -0.13714599609375, -0.1322021484375, -0.12725830078125, -0.122314453125, -0.11737060546875, -0.1124267578125, -0.10748291015625, -0.1025390625, -0.09759521484375, -0.0926513671875, -0.08770751953125, -0.082763671875, -0.07781982421875, -0.0728759765625, -0.06793212890625, -0.06298828125, -0.05804443359375, -0.0531005859375, -0.04815673828125, -0.043212890625, -0.03826904296875, -0.0333251953125, -0.02838134765625, -0.0234375, -0.01849365234375, -0.0135498046875, -0.00860595703125, -0.003662109375, 0.00128173828125, 0.0062255859375, 0.01116943359375, 0.01611328125, 0.02105712890625, 0.0260009765625, 0.03094482421875, 0.035888671875, 0.04083251953125, 0.0457763671875, 0.05072021484375, 0.0556640625, 0.06060791015625, 0.0655517578125, 0.07049560546875, 0.075439453125, 0.08038330078125, 0.0853271484375, 0.09027099609375, 0.09521484375, 0.10015869140625, 0.1051025390625, 0.11004638671875, 0.114990234375, 0.11993408203125, 0.1248779296875, 0.12982177734375, 0.134765625, 0.13970947265625, 0.1446533203125, 0.14959716796875, 0.154541015625, 0.15948486328125, 0.1644287109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 9.0, 7.0, 9.0, 12.0, 9.0, 15.0, 24.0, 34.0, 39.0, 57.0, 65.0, 108.0, 107.0, 115.0, 97.0, 65.0, 46.0, 43.0, 29.0, 32.0, 12.0, 10.0, 16.0, 8.0, 5.0, 13.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.123291015625, -0.11816596984863281, -0.11304092407226562, -0.10791587829589844, -0.10279083251953125, -0.09766578674316406, -0.09254074096679688, -0.08741569519042969, -0.0822906494140625, -0.07716560363769531, -0.07204055786132812, -0.06691551208496094, -0.06179046630859375, -0.05666542053222656, -0.051540374755859375, -0.04641532897949219, -0.041290283203125, -0.03616523742675781, -0.031040191650390625, -0.025915145874023438, -0.02079010009765625, -0.015665054321289062, -0.010540008544921875, -0.0054149627685546875, -0.0002899169921875, 0.0048351287841796875, 0.009960174560546875, 0.015085220336914062, 0.02021026611328125, 0.025335311889648438, 0.030460357666015625, 0.03558540344238281, 0.04071044921875, 0.04583549499511719, 0.050960540771484375, 0.05608558654785156, 0.06121063232421875, 0.06633567810058594, 0.07146072387695312, 0.07658576965332031, 0.0817108154296875, 0.08683586120605469, 0.09196090698242188, 0.09708595275878906, 0.10221099853515625, 0.10733604431152344, 0.11246109008789062, 0.11758613586425781, 0.122711181640625, 0.1278362274169922, 0.13296127319335938, 0.13808631896972656, 0.14321136474609375, 0.14833641052246094, 0.15346145629882812, 0.1585865020751953, 0.1637115478515625, 0.1688365936279297, 0.17396163940429688, 0.17908668518066406, 0.18421173095703125, 0.18933677673339844, 0.19446182250976562, 0.1995868682861328, 0.2047119140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 9.0, 15.0, 55.0, 165.0, 467.0, 205.0, 57.0, 14.0, 8.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4672179222106934, -3.280125856399536, -3.0930335521698, -2.9059414863586426, -2.7188491821289062, -2.531757116317749, -2.344665050506592, -2.1575727462768555, -1.9704806804656982, -1.7833884954452515, -1.5962963104248047, -1.4092042446136475, -1.2221120595932007, -1.035019874572754, -0.8479278087615967, -0.6608356237411499, -0.4737434387207031, -0.28665128350257874, -0.09955912828445435, 0.08753299713134766, 0.27462518215179443, 0.4617173671722412, 0.6488094329833984, 0.8359016180038452, 1.022993803024292, 1.2100859880447388, 1.3971781730651855, 1.5842702388763428, 1.7713624238967896, 1.9584546089172363, 2.1455466747283936, 2.332638740539551, 2.519730567932129, 2.706822633743286, 2.8939149379730225, 3.0810070037841797, 3.268099308013916, 3.4551913738250732, 3.6422834396362305, 3.829375743865967, 4.016468048095703, 4.2035603523254395, 4.390652179718018, 4.577744483947754, 4.76483678817749, 4.951929092407227, 5.139020919799805, 5.326113224029541, 5.513205051422119, 5.7002973556518555, 5.887389183044434, 6.07448148727417, 6.261573791503906, 6.448665618896484, 6.635757923126221, 6.822850227355957, 7.009942054748535, 7.1970343589782715, 7.38412618637085, 7.571218490600586, 7.758310794830322, 7.945403099060059, 8.132494926452637, 8.319586753845215, 8.50667953491211]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 3.0, 8.0, 5.0, 13.0, 14.0, 15.0, 11.0, 16.0, 19.0, 21.0, 25.0, 28.0, 31.0, 28.0, 37.0, 43.0, 58.0, 55.0, 57.0, 82.0, 41.0, 46.0, 37.0, 34.0, 33.0, 32.0, 24.0, 30.0, 19.0, 15.0, 19.0, 14.0, 10.0, 18.0, 7.0, 8.0, 6.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5590248107910156, -1.507304072380066, -1.4555834531784058, -1.403862714767456, -1.352142095565796, -1.3004213571548462, -1.2487006187438965, -1.1969799995422363, -1.1452593803405762, -1.0935386419296265, -1.0418180227279663, -0.9900972843170166, -0.9383766651153564, -0.8866559267044067, -0.8349352478981018, -0.7832145690917969, -0.7314938306808472, -0.6797731518745422, -0.6280524730682373, -0.5763317346572876, -0.5246111154556274, -0.4728904068470001, -0.4211696982383728, -0.36944901943206787, -0.31772834062576294, -0.266007661819458, -0.21428696811199188, -0.16256627440452576, -0.11084559559822083, -0.059124916791915894, -0.007404208183288574, 0.04431647062301636, 0.09603714942932129, 0.14775782823562622, 0.19947852194309235, 0.25119921565055847, 0.3029198944568634, 0.35464057326316833, 0.40636128187179565, 0.4580819606781006, 0.5098026394844055, 0.5615233182907104, 0.6132439970970154, 0.6649646759033203, 0.71668541431427, 0.7684060335159302, 0.8201267719268799, 0.8718474507331848, 0.9235681295394897, 0.9752888083457947, 1.0270094871520996, 1.0787302255630493, 1.1304508447647095, 1.1821715831756592, 1.2338922023773193, 1.285612940788269, 1.3373336791992188, 1.3890544176101685, 1.4407750368118286, 1.4924957752227783, 1.5442163944244385, 1.5959371328353882, 1.647657871246338, 1.699378490447998, 1.7510991096496582]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 17.0, 16.0, 37.0, 55.0, 105.0, 170.0, 332.0, 665.0, 1815.0, 6036.0, 35722.0, 1005313.0, 3039226.0, 89888.0, 10249.0, 2735.0, 968.0, 422.0, 207.0, 105.0, 73.0, 35.0, 23.0, 19.0, 13.0, 5.0, 8.0, 1.0, 3.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.19788551330566406, -0.18935012817382812, -0.1808147430419922, -0.17227935791015625, -0.1637439727783203, -0.15520858764648438, -0.14667320251464844, -0.1381378173828125, -0.12960243225097656, -0.12106704711914062, -0.11253166198730469, -0.10399627685546875, -0.09546089172363281, -0.08692550659179688, -0.07839012145996094, -0.069854736328125, -0.06131935119628906, -0.052783966064453125, -0.04424858093261719, -0.03571319580078125, -0.027177810668945312, -0.018642425537109375, -0.010107040405273438, -0.0015716552734375, 0.0069637298583984375, 0.015499114990234375, 0.024034500122070312, 0.03256988525390625, 0.04110527038574219, 0.049640655517578125, 0.05817604064941406, 0.06671142578125, 0.07524681091308594, 0.08378219604492188, 0.09231758117675781, 0.10085296630859375, 0.10938835144042969, 0.11792373657226562, 0.12645912170410156, 0.1349945068359375, 0.14352989196777344, 0.15206527709960938, 0.1606006622314453, 0.16913604736328125, 0.1776714324951172, 0.18620681762695312, 0.19474220275878906, 0.203277587890625, 0.21181297302246094, 0.22034835815429688, 0.2288837432861328, 0.23741912841796875, 0.2459545135498047, 0.2544898986816406, 0.26302528381347656, 0.2715606689453125, 0.28009605407714844, 0.2886314392089844, 0.2971668243408203, 0.30570220947265625, 0.3142375946044922, 0.3227729797363281, 0.33130836486816406, 0.33984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 16.0, 22.0, 23.0, 28.0, 35.0, 45.0, 68.0, 68.0, 75.0, 88.0, 90.0, 56.0, 61.0, 66.0, 60.0, 49.0, 32.0, 29.0, 14.0, 18.0, 15.0, 8.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1324462890625, -0.12719345092773438, -0.12194061279296875, -0.11668777465820312, -0.1114349365234375, -0.10618209838867188, -0.10092926025390625, -0.09567642211914062, -0.090423583984375, -0.08517074584960938, -0.07991790771484375, -0.07466506958007812, -0.0694122314453125, -0.06415939331054688, -0.05890655517578125, -0.053653717041015625, -0.04840087890625, -0.043148040771484375, -0.03789520263671875, -0.032642364501953125, -0.0273895263671875, -0.022136688232421875, -0.01688385009765625, -0.011631011962890625, -0.006378173828125, -0.001125335693359375, 0.00412750244140625, 0.009380340576171875, 0.0146331787109375, 0.019886016845703125, 0.02513885498046875, 0.030391693115234375, 0.03564453125, 0.040897369384765625, 0.04615020751953125, 0.051403045654296875, 0.0566558837890625, 0.061908721923828125, 0.06716156005859375, 0.07241439819335938, 0.077667236328125, 0.08292007446289062, 0.08817291259765625, 0.09342575073242188, 0.0986785888671875, 0.10393142700195312, 0.10918426513671875, 0.11443710327148438, 0.11968994140625, 0.12494277954101562, 0.13019561767578125, 0.13544845581054688, 0.1407012939453125, 0.14595413208007812, 0.15120697021484375, 0.15645980834960938, 0.161712646484375, 0.16696548461914062, 0.17221832275390625, 0.17747116088867188, 0.1827239990234375, 0.18797683715820312, 0.19322967529296875, 0.19848251342773438, 0.2037353515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 13.0, 24.0, 35.0, 46.0, 103.0, 193.0, 406.0, 1001.0, 3348.0, 16199.0, 416883.0, 3693354.0, 53263.0, 6448.0, 1770.0, 654.0, 272.0, 101.0, 54.0, 43.0, 22.0, 20.0, 4.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37158203125, -0.35794830322265625, -0.3443145751953125, -0.33068084716796875, -0.317047119140625, -0.30341339111328125, -0.2897796630859375, -0.27614593505859375, -0.26251220703125, -0.24887847900390625, -0.2352447509765625, -0.22161102294921875, -0.207977294921875, -0.19434356689453125, -0.1807098388671875, -0.16707611083984375, -0.1534423828125, -0.13980865478515625, -0.1261749267578125, -0.11254119873046875, -0.098907470703125, -0.08527374267578125, -0.0716400146484375, -0.05800628662109375, -0.04437255859375, -0.03073883056640625, -0.0171051025390625, -0.00347137451171875, 0.010162353515625, 0.02379608154296875, 0.0374298095703125, 0.05106353759765625, 0.064697265625, 0.07833099365234375, 0.0919647216796875, 0.10559844970703125, 0.119232177734375, 0.13286590576171875, 0.1464996337890625, 0.16013336181640625, 0.17376708984375, 0.18740081787109375, 0.2010345458984375, 0.21466827392578125, 0.228302001953125, 0.24193572998046875, 0.2555694580078125, 0.26920318603515625, 0.2828369140625, 0.29647064208984375, 0.3101043701171875, 0.32373809814453125, 0.337371826171875, 0.35100555419921875, 0.3646392822265625, 0.37827301025390625, 0.39190673828125, 0.40554046630859375, 0.4191741943359375, 0.43280792236328125, 0.446441650390625, 0.46007537841796875, 0.4737091064453125, 0.48734283447265625, 0.5009765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 21.0, 19.0, 26.0, 54.0, 96.0, 164.0, 343.0, 601.0, 951.0, 824.0, 425.0, 243.0, 127.0, 57.0, 41.0, 12.0, 11.0, 11.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.2948760986328125, -0.285308837890625, -0.2757415771484375, -0.26617431640625, -0.2566070556640625, -0.247039794921875, -0.2374725341796875, -0.2279052734375, -0.2183380126953125, -0.208770751953125, -0.1992034912109375, -0.18963623046875, -0.1800689697265625, -0.170501708984375, -0.1609344482421875, -0.1513671875, -0.1417999267578125, -0.132232666015625, -0.1226654052734375, -0.11309814453125, -0.1035308837890625, -0.093963623046875, -0.0843963623046875, -0.0748291015625, -0.0652618408203125, -0.055694580078125, -0.0461273193359375, -0.03656005859375, -0.0269927978515625, -0.017425537109375, -0.0078582763671875, 0.001708984375, 0.0112762451171875, 0.020843505859375, 0.0304107666015625, 0.03997802734375, 0.0495452880859375, 0.059112548828125, 0.0686798095703125, 0.0782470703125, 0.0878143310546875, 0.097381591796875, 0.1069488525390625, 0.11651611328125, 0.1260833740234375, 0.135650634765625, 0.1452178955078125, 0.15478515625, 0.1643524169921875, 0.173919677734375, 0.1834869384765625, 0.19305419921875, 0.2026214599609375, 0.212188720703125, 0.2217559814453125, 0.2313232421875, 0.2408905029296875, 0.250457763671875, 0.2600250244140625, 0.26959228515625, 0.2791595458984375, 0.288726806640625, 0.2982940673828125, 0.307861328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 6.0, 13.0, 60.0, 187.0, 387.0, 237.0, 67.0, 20.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.243610858917236, -7.094602108001709, -6.94559383392334, -6.7965850830078125, -6.647576332092285, -6.498568058013916, -6.349559307098389, -6.2005510330200195, -6.051542282104492, -5.902533531188965, -5.753525257110596, -5.604516506195068, -5.455508232116699, -5.306499481201172, -5.1574907302856445, -5.008481979370117, -4.859473705291748, -4.710464954376221, -4.561456680297852, -4.412447929382324, -4.263439178466797, -4.114430904388428, -3.9654221534729004, -3.816413640975952, -3.667405128479004, -3.5183966159820557, -3.3693881034851074, -3.22037935256958, -3.071370840072632, -2.9223623275756836, -2.7733535766601562, -2.624345064163208, -2.4753365516662598, -2.3263280391693115, -2.1773195266723633, -2.028310775756836, -1.8793022632598877, -1.7302937507629395, -1.5812851190567017, -1.4322764873504639, -1.2832679748535156, -1.1342594623565674, -0.9852508306503296, -0.8362422585487366, -0.6872336864471436, -0.5382251143455505, -0.3892165422439575, -0.24020791053771973, -0.09119939804077148, 0.05780917406082153, 0.20681774616241455, 0.35582631826400757, 0.5048348903656006, 0.6538434624671936, 0.8028520345687866, 0.9518606662750244, 1.1008691787719727, 1.249877691268921, 1.3988863229751587, 1.5478949546813965, 1.6969034671783447, 1.845911979675293, 1.9949206113815308, 2.1439292430877686, 2.292937755584717]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 12.0, 10.0, 17.0, 24.0, 23.0, 22.0, 15.0, 28.0, 41.0, 51.0, 42.0, 49.0, 52.0, 49.0, 58.0, 54.0, 59.0, 51.0, 56.0, 60.0, 36.0, 26.0, 39.0, 28.0, 20.0, 22.0, 12.0, 8.0, 10.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.3525437116622925, -1.3168846368789673, -1.2812256813049316, -1.2455666065216064, -1.2099075317382812, -1.174248456954956, -1.1385895013809204, -1.1029304265975952, -1.0672714710235596, -1.0316123962402344, -0.995953381061554, -0.9602943658828735, -0.9246352910995483, -0.8889762759208679, -0.8533172607421875, -0.8176581859588623, -0.7819991111755371, -0.7463400959968567, -0.7106810212135315, -0.6750220060348511, -0.6393629312515259, -0.6037039160728455, -0.568044900894165, -0.5323858261108398, -0.4967268109321594, -0.4610677659511566, -0.4254087209701538, -0.3897497057914734, -0.3540906608104706, -0.3184316158294678, -0.28277260065078735, -0.24711355566978455, -0.2114545702934265, -0.1757955253124237, -0.1401364952325821, -0.10447745770215988, -0.06881842017173767, -0.03315937519073486, 0.0024996548891067505, 0.038158684968948364, 0.07381772994995117, 0.10947676748037338, 0.1451358050107956, 0.1807948350906372, 0.21645388007164001, 0.2521129250526428, 0.28777194023132324, 0.32343098521232605, 0.35909003019332886, 0.39474907517433167, 0.4304081201553345, 0.4660671353340149, 0.5017261505126953, 0.5373852252960205, 0.5730442404747009, 0.6087032556533813, 0.6443623304367065, 0.680021345615387, 0.7156804203987122, 0.7513394355773926, 0.7869985103607178, 0.8226575255393982, 0.8583165407180786, 0.8939756155014038, 0.9296346306800842]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 6.0, 9.0, 13.0, 13.0, 30.0, 38.0, 42.0, 62.0, 119.0, 174.0, 300.0, 535.0, 997.0, 2067.0, 4803.0, 12622.0, 39549.0, 158708.0, 459028.0, 270080.0, 67153.0, 19480.0, 6765.0, 2939.0, 1323.0, 696.0, 394.0, 204.0, 118.0, 97.0, 45.0, 39.0, 20.0, 20.0, 13.0, 21.0, 4.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.17241668701171875, -0.1666107177734375, -0.16080474853515625, -0.154998779296875, -0.14919281005859375, -0.1433868408203125, -0.13758087158203125, -0.13177490234375, -0.12596893310546875, -0.1201629638671875, -0.11435699462890625, -0.108551025390625, -0.10274505615234375, -0.0969390869140625, -0.09113311767578125, -0.0853271484375, -0.07952117919921875, -0.0737152099609375, -0.06790924072265625, -0.062103271484375, -0.05629730224609375, -0.0504913330078125, -0.04468536376953125, -0.03887939453125, -0.03307342529296875, -0.0272674560546875, -0.02146148681640625, -0.015655517578125, -0.00984954833984375, -0.0040435791015625, 0.00176239013671875, 0.007568359375, 0.01337432861328125, 0.0191802978515625, 0.02498626708984375, 0.030792236328125, 0.03659820556640625, 0.0424041748046875, 0.04821014404296875, 0.05401611328125, 0.05982208251953125, 0.0656280517578125, 0.07143402099609375, 0.077239990234375, 0.08304595947265625, 0.0888519287109375, 0.09465789794921875, 0.1004638671875, 0.10626983642578125, 0.1120758056640625, 0.11788177490234375, 0.123687744140625, 0.12949371337890625, 0.1352996826171875, 0.14110565185546875, 0.14691162109375, 0.15271759033203125, 0.1585235595703125, 0.16432952880859375, 0.170135498046875, 0.17594146728515625, 0.1817474365234375, 0.18755340576171875, 0.193359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 14.0, 15.0, 25.0, 31.0, 26.0, 45.0, 54.0, 50.0, 78.0, 65.0, 86.0, 60.0, 64.0, 81.0, 55.0, 45.0, 45.0, 40.0, 23.0, 16.0, 18.0, 15.0, 7.0, 9.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.13736724853515625, -0.1322784423828125, -0.12718963623046875, -0.122100830078125, -0.11701202392578125, -0.1119232177734375, -0.10683441162109375, -0.10174560546875, -0.09665679931640625, -0.0915679931640625, -0.08647918701171875, -0.081390380859375, -0.07630157470703125, -0.0712127685546875, -0.06612396240234375, -0.06103515625, -0.05594635009765625, -0.0508575439453125, -0.04576873779296875, -0.040679931640625, -0.03559112548828125, -0.0305023193359375, -0.02541351318359375, -0.02032470703125, -0.01523590087890625, -0.0101470947265625, -0.00505828857421875, 3.0517578125e-05, 0.00511932373046875, 0.0102081298828125, 0.01529693603515625, 0.0203857421875, 0.02547454833984375, 0.0305633544921875, 0.03565216064453125, 0.040740966796875, 0.04582977294921875, 0.0509185791015625, 0.05600738525390625, 0.06109619140625, 0.06618499755859375, 0.0712738037109375, 0.07636260986328125, 0.081451416015625, 0.08654022216796875, 0.0916290283203125, 0.09671783447265625, 0.101806640625, 0.10689544677734375, 0.1119842529296875, 0.11707305908203125, 0.122161865234375, 0.12725067138671875, 0.1323394775390625, 0.13742828369140625, 0.14251708984375, 0.14760589599609375, 0.1526947021484375, 0.15778350830078125, 0.162872314453125, 0.16796112060546875, 0.1730499267578125, 0.17813873291015625, 0.1832275390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 7.0, 5.0, 9.0, 9.0, 23.0, 27.0, 37.0, 36.0, 58.0, 94.0, 165.0, 272.0, 797.0, 2630.0, 13688.0, 134983.0, 774224.0, 106507.0, 11251.0, 2291.0, 707.0, 284.0, 152.0, 93.0, 54.0, 35.0, 34.0, 12.0, 20.0, 15.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2974090576171875, -0.286956787109375, -0.2765045166015625, -0.26605224609375, -0.2555999755859375, -0.245147705078125, -0.2346954345703125, -0.2242431640625, -0.2137908935546875, -0.203338623046875, -0.1928863525390625, -0.18243408203125, -0.1719818115234375, -0.161529541015625, -0.1510772705078125, -0.140625, -0.1301727294921875, -0.119720458984375, -0.1092681884765625, -0.09881591796875, -0.0883636474609375, -0.077911376953125, -0.0674591064453125, -0.0570068359375, -0.0465545654296875, -0.036102294921875, -0.0256500244140625, -0.01519775390625, -0.0047454833984375, 0.005706787109375, 0.0161590576171875, 0.026611328125, 0.0370635986328125, 0.047515869140625, 0.0579681396484375, 0.06842041015625, 0.0788726806640625, 0.089324951171875, 0.0997772216796875, 0.1102294921875, 0.1206817626953125, 0.131134033203125, 0.1415863037109375, 0.15203857421875, 0.1624908447265625, 0.172943115234375, 0.1833953857421875, 0.19384765625, 0.2042999267578125, 0.214752197265625, 0.2252044677734375, 0.23565673828125, 0.2461090087890625, 0.256561279296875, 0.2670135498046875, 0.2774658203125, 0.2879180908203125, 0.298370361328125, 0.3088226318359375, 0.31927490234375, 0.3297271728515625, 0.340179443359375, 0.3506317138671875, 0.361083984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 8.0, 2.0, 6.0, 8.0, 15.0, 18.0, 13.0, 23.0, 32.0, 38.0, 50.0, 47.0, 51.0, 61.0, 64.0, 60.0, 67.0, 63.0, 54.0, 50.0, 57.0, 45.0, 31.0, 30.0, 24.0, 24.0, 10.0, 16.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6083984375, -0.5923042297363281, -0.5762100219726562, -0.5601158142089844, -0.5440216064453125, -0.5279273986816406, -0.5118331909179688, -0.4957389831542969, -0.479644775390625, -0.4635505676269531, -0.44745635986328125, -0.4313621520996094, -0.4152679443359375, -0.3991737365722656, -0.38307952880859375, -0.3669853210449219, -0.35089111328125, -0.3347969055175781, -0.31870269775390625, -0.3026084899902344, -0.2865142822265625, -0.2704200744628906, -0.25432586669921875, -0.23823165893554688, -0.222137451171875, -0.20604324340820312, -0.18994903564453125, -0.17385482788085938, -0.1577606201171875, -0.14166641235351562, -0.12557220458984375, -0.10947799682617188, -0.0933837890625, -0.07728958129882812, -0.06119537353515625, -0.045101165771484375, -0.0290069580078125, -0.012912750244140625, 0.00318145751953125, 0.019275665283203125, 0.035369873046875, 0.051464080810546875, 0.06755828857421875, 0.08365249633789062, 0.0997467041015625, 0.11584091186523438, 0.13193511962890625, 0.14802932739257812, 0.16412353515625, 0.18021774291992188, 0.19631195068359375, 0.21240615844726562, 0.2285003662109375, 0.24459457397460938, 0.26068878173828125, 0.2767829895019531, 0.292877197265625, 0.3089714050292969, 0.32506561279296875, 0.3411598205566406, 0.3572540283203125, 0.3733482360839844, 0.38944244384765625, 0.4055366516113281, 0.421630859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 9.0, 23.0, 27.0, 49.0, 108.0, 216.0, 465.0, 1297.0, 3594.0, 12631.0, 68362.0, 691539.0, 228927.0, 30385.0, 7082.0, 2299.0, 881.0, 331.0, 157.0, 69.0, 34.0, 23.0, 13.0, 12.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1326904296875, -0.12851524353027344, -0.12434005737304688, -0.12016487121582031, -0.11598968505859375, -0.11181449890136719, -0.10763931274414062, -0.10346412658691406, -0.0992889404296875, -0.09511375427246094, -0.09093856811523438, -0.08676338195800781, -0.08258819580078125, -0.07841300964355469, -0.07423782348632812, -0.07006263732910156, -0.065887451171875, -0.06171226501464844, -0.057537078857421875, -0.05336189270019531, -0.04918670654296875, -0.04501152038574219, -0.040836334228515625, -0.03666114807128906, -0.0324859619140625, -0.028310775756835938, -0.024135589599609375, -0.019960403442382812, -0.01578521728515625, -0.011610031127929688, -0.007434844970703125, -0.0032596588134765625, 0.00091552734375, 0.0050907135009765625, 0.009265899658203125, 0.013441085815429688, 0.01761627197265625, 0.021791458129882812, 0.025966644287109375, 0.030141830444335938, 0.0343170166015625, 0.03849220275878906, 0.042667388916015625, 0.04684257507324219, 0.05101776123046875, 0.05519294738769531, 0.059368133544921875, 0.06354331970214844, 0.067718505859375, 0.07189369201660156, 0.07606887817382812, 0.08024406433105469, 0.08441925048828125, 0.08859443664550781, 0.09276962280273438, 0.09694480895996094, 0.1011199951171875, 0.10529518127441406, 0.10947036743164062, 0.11364555358886719, 0.11782073974609375, 0.12199592590332031, 0.12617111206054688, 0.13034629821777344, 0.134521484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 3.0, 4.0, 7.0, 5.0, 6.0, 11.0, 9.0, 17.0, 23.0, 26.0, 32.0, 43.0, 58.0, 75.0, 81.0, 87.0, 110.0, 88.0, 70.0, 60.0, 52.0, 44.0, 29.0, 13.0, 15.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.112720489501953e-05, -3.980565816164017e-05, -3.84841114282608e-05, -3.716256469488144e-05, -3.5841017961502075e-05, -3.451947122812271e-05, -3.319792449474335e-05, -3.187637776136398e-05, -3.055483102798462e-05, -2.9233284294605255e-05, -2.791173756122589e-05, -2.6590190827846527e-05, -2.5268644094467163e-05, -2.39470973610878e-05, -2.2625550627708435e-05, -2.130400389432907e-05, -1.9982457160949707e-05, -1.8660910427570343e-05, -1.733936369419098e-05, -1.6017816960811615e-05, -1.4696270227432251e-05, -1.3374723494052887e-05, -1.2053176760673523e-05, -1.0731630027294159e-05, -9.410083293914795e-06, -8.088536560535431e-06, -6.766989827156067e-06, -5.445443093776703e-06, -4.123896360397339e-06, -2.802349627017975e-06, -1.4808028936386108e-06, -1.5925616025924683e-07, 1.1622905731201172e-06, 2.483837306499481e-06, 3.8053840398788452e-06, 5.126930773258209e-06, 6.448477506637573e-06, 7.770024240016937e-06, 9.091570973396301e-06, 1.0413117706775665e-05, 1.173466444015503e-05, 1.3056211173534393e-05, 1.4377757906913757e-05, 1.569930464029312e-05, 1.7020851373672485e-05, 1.834239810705185e-05, 1.9663944840431213e-05, 2.0985491573810577e-05, 2.230703830718994e-05, 2.3628585040569305e-05, 2.495013177394867e-05, 2.6271678507328033e-05, 2.7593225240707397e-05, 2.891477197408676e-05, 3.0236318707466125e-05, 3.155786544084549e-05, 3.2879412174224854e-05, 3.420095890760422e-05, 3.552250564098358e-05, 3.6844052374362946e-05, 3.816559910774231e-05, 3.9487145841121674e-05, 4.080869257450104e-05, 4.21302393078804e-05, 4.3451786041259766e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 11.0, 16.0, 14.0, 27.0, 37.0, 42.0, 87.0, 114.0, 193.0, 302.0, 539.0, 941.0, 1704.0, 3545.0, 7512.0, 18110.0, 53544.0, 193757.0, 569166.0, 134005.0, 38552.0, 14109.0, 5887.0, 2816.0, 1504.0, 778.0, 421.0, 268.0, 169.0, 93.0, 81.0, 45.0, 33.0, 34.0, 17.0, 19.0, 11.0, 12.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07381343841552734, -0.07121086120605469, -0.06860828399658203, -0.06600570678710938, -0.06340312957763672, -0.06080055236816406, -0.058197975158691406, -0.05559539794921875, -0.052992820739746094, -0.05039024353027344, -0.04778766632080078, -0.045185089111328125, -0.04258251190185547, -0.03997993469238281, -0.037377357482910156, -0.0347747802734375, -0.032172203063964844, -0.029569625854492188, -0.02696704864501953, -0.024364471435546875, -0.02176189422607422, -0.019159317016601562, -0.016556739807128906, -0.01395416259765625, -0.011351585388183594, -0.008749008178710938, -0.006146430969238281, -0.003543853759765625, -0.0009412765502929688, 0.0016613006591796875, 0.004263877868652344, 0.006866455078125, 0.009469032287597656, 0.012071609497070312, 0.014674186706542969, 0.017276763916015625, 0.01987934112548828, 0.022481918334960938, 0.025084495544433594, 0.02768707275390625, 0.030289649963378906, 0.03289222717285156, 0.03549480438232422, 0.038097381591796875, 0.04069995880126953, 0.04330253601074219, 0.045905113220214844, 0.0485076904296875, 0.051110267639160156, 0.05371284484863281, 0.05631542205810547, 0.058917999267578125, 0.06152057647705078, 0.06412315368652344, 0.0667257308959961, 0.06932830810546875, 0.0719308853149414, 0.07453346252441406, 0.07713603973388672, 0.07973861694335938, 0.08234119415283203, 0.08494377136230469, 0.08754634857177734, 0.09014892578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 13.0, 17.0, 24.0, 46.0, 58.0, 107.0, 139.0, 156.0, 147.0, 123.0, 58.0, 42.0, 36.0, 9.0, 11.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.274169921875, -0.2684011459350586, -0.2626323699951172, -0.2568635940551758, -0.2510948181152344, -0.24532604217529297, -0.23955726623535156, -0.23378849029541016, -0.22801971435546875, -0.22225093841552734, -0.21648216247558594, -0.21071338653564453, -0.20494461059570312, -0.19917583465576172, -0.1934070587158203, -0.1876382827758789, -0.1818695068359375, -0.1761007308959961, -0.1703319549560547, -0.16456317901611328, -0.15879440307617188, -0.15302562713623047, -0.14725685119628906, -0.14148807525634766, -0.13571929931640625, -0.12995052337646484, -0.12418174743652344, -0.11841297149658203, -0.11264419555664062, -0.10687541961669922, -0.10110664367675781, -0.0953378677368164, -0.089569091796875, -0.0838003158569336, -0.07803153991699219, -0.07226276397705078, -0.06649398803710938, -0.06072521209716797, -0.05495643615722656, -0.049187660217285156, -0.04341888427734375, -0.037650108337402344, -0.03188133239746094, -0.02611255645751953, -0.020343780517578125, -0.014575004577636719, -0.008806228637695312, -0.0030374526977539062, 0.0027313232421875, 0.008500099182128906, 0.014268875122070312, 0.02003765106201172, 0.025806427001953125, 0.03157520294189453, 0.03734397888183594, 0.043112754821777344, 0.04888153076171875, 0.054650306701660156, 0.06041908264160156, 0.06618785858154297, 0.07195663452148438, 0.07772541046142578, 0.08349418640136719, 0.0892629623413086, 0.09503173828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 13.0, 35.0, 98.0, 216.0, 363.0, 138.0, 68.0, 27.0, 10.0, 12.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.572631359100342, -4.467034339904785, -4.361437797546387, -4.25584077835083, -4.150243759155273, -4.044646739959717, -3.9390499591827393, -3.8334531784057617, -3.727856159210205, -3.6222591400146484, -3.516662359237671, -3.4110655784606934, -3.3054685592651367, -3.19987154006958, -3.0942747592926025, -2.988677978515625, -2.8830809593200684, -2.7774839401245117, -2.671887159347534, -2.5662903785705566, -2.460693359375, -2.3550963401794434, -2.249499559402466, -2.1439027786254883, -2.0383057594299316, -1.9327088594436646, -1.8271119594573975, -1.7215150594711304, -1.6159181594848633, -1.5103212594985962, -1.404724359512329, -1.299127459526062, -1.193530559539795, -1.0879336595535278, -0.9823367595672607, -0.8767398595809937, -0.7711429595947266, -0.6655460596084595, -0.5599491596221924, -0.4543522596359253, -0.3487553596496582, -0.2431584596633911, -0.13756155967712402, -0.031964659690856934, 0.07363224029541016, 0.17922914028167725, 0.28482604026794434, 0.3904229402542114, 0.4960198402404785, 0.6016167402267456, 0.7072136402130127, 0.8128105401992798, 0.9184074401855469, 1.024004340171814, 1.129601240158081, 1.2351981401443481, 1.3407950401306152, 1.4463919401168823, 1.5519888401031494, 1.6575857400894165, 1.7631826400756836, 1.8687795400619507, 1.9743764400482178, 2.0799732208251953, 2.185570240020752]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 9.0, 6.0, 8.0, 9.0, 9.0, 9.0, 13.0, 15.0, 20.0, 17.0, 21.0, 29.0, 28.0, 32.0, 39.0, 35.0, 44.0, 73.0, 68.0, 76.0, 70.0, 57.0, 36.0, 36.0, 31.0, 38.0, 32.0, 24.0, 17.0, 17.0, 16.0, 24.0, 10.0, 10.0, 5.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5206475257873535, -1.469054937362671, -1.4174623489379883, -1.3658697605133057, -1.3142770528793335, -1.2626844644546509, -1.2110918760299683, -1.1594992876052856, -1.107906699180603, -1.0563141107559204, -1.0047215223312378, -0.9531288743019104, -0.9015362858772278, -0.8499436378479004, -0.7983510494232178, -0.7467584609985352, -0.6951658129692078, -0.6435732245445251, -0.5919805765151978, -0.5403879880905151, -0.4887953996658325, -0.4372027814388275, -0.3856101632118225, -0.3340175747871399, -0.2824249565601349, -0.23083235323429108, -0.17923974990844727, -0.12764713168144226, -0.07605452835559845, -0.02446192502975464, 0.027130693197250366, 0.07872328162193298, 0.130315899848938, 0.1819085031747818, 0.2335011065006256, 0.2850937247276306, 0.33668631315231323, 0.38827893137931824, 0.43987154960632324, 0.49146413803100586, 0.5430567264556885, 0.5946493148803711, 0.6462419629096985, 0.6978345513343811, 0.7494271397590637, 0.8010197877883911, 0.8526123762130737, 0.9042049646377563, 0.9557976126670837, 1.0073902606964111, 1.0589828491210938, 1.1105754375457764, 1.162168025970459, 1.2137606143951416, 1.2653532028198242, 1.3169457912445068, 1.368538498878479, 1.4201310873031616, 1.4717236757278442, 1.5233163833618164, 1.574908971786499, 1.6265015602111816, 1.6780941486358643, 1.7296867370605469, 1.7812793254852295]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 12.0, 11.0, 18.0, 39.0, 43.0, 71.0, 158.0, 262.0, 479.0, 950.0, 2357.0, 7320.0, 35959.0, 498633.0, 3269213.0, 342220.0, 26948.0, 5647.0, 2049.0, 851.0, 429.0, 251.0, 138.0, 71.0, 43.0, 37.0, 19.0, 19.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15535926818847656, -0.14873123168945312, -0.1421031951904297, -0.13547515869140625, -0.1288471221923828, -0.12221908569335938, -0.11559104919433594, -0.1089630126953125, -0.10233497619628906, -0.09570693969726562, -0.08907890319824219, -0.08245086669921875, -0.07582283020019531, -0.06919479370117188, -0.06256675720214844, -0.055938720703125, -0.04931068420410156, -0.042682647705078125, -0.03605461120605469, -0.02942657470703125, -0.022798538208007812, -0.016170501708984375, -0.009542465209960938, -0.0029144287109375, 0.0037136077880859375, 0.010341644287109375, 0.016969680786132812, 0.02359771728515625, 0.030225753784179688, 0.036853790283203125, 0.04348182678222656, 0.05010986328125, 0.05673789978027344, 0.06336593627929688, 0.06999397277832031, 0.07662200927734375, 0.08325004577636719, 0.08987808227539062, 0.09650611877441406, 0.1031341552734375, 0.10976219177246094, 0.11639022827148438, 0.12301826477050781, 0.12964630126953125, 0.1362743377685547, 0.14290237426757812, 0.14953041076660156, 0.156158447265625, 0.16278648376464844, 0.16941452026367188, 0.1760425567626953, 0.18267059326171875, 0.1892986297607422, 0.19592666625976562, 0.20255470275878906, 0.2091827392578125, 0.21581077575683594, 0.22243881225585938, 0.2290668487548828, 0.23569488525390625, 0.2423229217529297, 0.24895095825195312, 0.25557899475097656, 0.26220703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 11.0, 22.0, 43.0, 31.0, 52.0, 58.0, 71.0, 69.0, 66.0, 81.0, 73.0, 76.0, 59.0, 53.0, 50.0, 48.0, 35.0, 21.0, 14.0, 5.0, 12.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.1405773162841797, -0.13528060913085938, -0.12998390197753906, -0.12468719482421875, -0.11939048767089844, -0.11409378051757812, -0.10879707336425781, -0.1035003662109375, -0.09820365905761719, -0.09290695190429688, -0.08761024475097656, -0.08231353759765625, -0.07701683044433594, -0.07172012329101562, -0.06642341613769531, -0.061126708984375, -0.05583000183105469, -0.050533294677734375, -0.04523658752441406, -0.03993988037109375, -0.03464317321777344, -0.029346466064453125, -0.024049758911132812, -0.0187530517578125, -0.013456344604492188, -0.008159637451171875, -0.0028629302978515625, 0.00243377685546875, 0.0077304840087890625, 0.013027191162109375, 0.018323898315429688, 0.02362060546875, 0.028917312622070312, 0.034214019775390625, 0.03951072692871094, 0.04480743408203125, 0.05010414123535156, 0.055400848388671875, 0.06069755554199219, 0.0659942626953125, 0.07129096984863281, 0.07658767700195312, 0.08188438415527344, 0.08718109130859375, 0.09247779846191406, 0.09777450561523438, 0.10307121276855469, 0.108367919921875, 0.11366462707519531, 0.11896133422851562, 0.12425804138183594, 0.12955474853515625, 0.13485145568847656, 0.14014816284179688, 0.1454448699951172, 0.1507415771484375, 0.1560382843017578, 0.16133499145507812, 0.16663169860839844, 0.17192840576171875, 0.17722511291503906, 0.18252182006835938, 0.1878185272216797, 0.193115234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 11.0, 24.0, 47.0, 68.0, 184.0, 430.0, 1618.0, 40316.0, 4125828.0, 23565.0, 1413.0, 456.0, 167.0, 83.0, 29.0, 15.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7163925170898438, -0.6920623779296875, -0.6677322387695312, -0.643402099609375, -0.6190719604492188, -0.5947418212890625, -0.5704116821289062, -0.54608154296875, -0.5217514038085938, -0.4974212646484375, -0.47309112548828125, -0.448760986328125, -0.42443084716796875, -0.4001007080078125, -0.37577056884765625, -0.3514404296875, -0.32711029052734375, -0.3027801513671875, -0.27845001220703125, -0.254119873046875, -0.22978973388671875, -0.2054595947265625, -0.18112945556640625, -0.15679931640625, -0.13246917724609375, -0.1081390380859375, -0.08380889892578125, -0.059478759765625, -0.03514862060546875, -0.0108184814453125, 0.01351165771484375, 0.037841796875, 0.06217193603515625, 0.0865020751953125, 0.11083221435546875, 0.135162353515625, 0.15949249267578125, 0.1838226318359375, 0.20815277099609375, 0.23248291015625, 0.25681304931640625, 0.2811431884765625, 0.30547332763671875, 0.329803466796875, 0.35413360595703125, 0.3784637451171875, 0.40279388427734375, 0.4271240234375, 0.45145416259765625, 0.4757843017578125, 0.5001144409179688, 0.524444580078125, 0.5487747192382812, 0.5731048583984375, 0.5974349975585938, 0.62176513671875, 0.6460952758789062, 0.6704254150390625, 0.6947555541992188, 0.719085693359375, 0.7434158325195312, 0.7677459716796875, 0.7920761108398438, 0.81640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 2.0, 3.0, 4.0, 3.0, 10.0, 23.0, 25.0, 35.0, 52.0, 96.0, 177.0, 385.0, 684.0, 886.0, 778.0, 386.0, 215.0, 126.0, 60.0, 44.0, 26.0, 13.0, 10.0, 15.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29541015625, -0.2868804931640625, -0.278350830078125, -0.2698211669921875, -0.26129150390625, -0.2527618408203125, -0.244232177734375, -0.2357025146484375, -0.2271728515625, -0.2186431884765625, -0.210113525390625, -0.2015838623046875, -0.19305419921875, -0.1845245361328125, -0.175994873046875, -0.1674652099609375, -0.158935546875, -0.1504058837890625, -0.141876220703125, -0.1333465576171875, -0.12481689453125, -0.1162872314453125, -0.107757568359375, -0.0992279052734375, -0.0906982421875, -0.0821685791015625, -0.073638916015625, -0.0651092529296875, -0.05657958984375, -0.0480499267578125, -0.039520263671875, -0.0309906005859375, -0.0224609375, -0.0139312744140625, -0.005401611328125, 0.0031280517578125, 0.01165771484375, 0.0201873779296875, 0.028717041015625, 0.0372467041015625, 0.0457763671875, 0.0543060302734375, 0.062835693359375, 0.0713653564453125, 0.07989501953125, 0.0884246826171875, 0.096954345703125, 0.1054840087890625, 0.114013671875, 0.1225433349609375, 0.131072998046875, 0.1396026611328125, 0.14813232421875, 0.1566619873046875, 0.165191650390625, 0.1737213134765625, 0.1822509765625, 0.1907806396484375, 0.199310302734375, 0.2078399658203125, 0.21636962890625, 0.2248992919921875, 0.233428955078125, 0.2419586181640625, 0.25048828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 11.0, 18.0, 51.0, 83.0, 187.0, 253.0, 162.0, 118.0, 55.0, 30.0, 19.0, 7.0, 1.0, 0.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142481565475464, -3.0541329383850098, -2.9657845497131348, -2.8774359226226807, -2.7890872955322266, -2.7007386684417725, -2.6123902797698975, -2.5240416526794434, -2.4356930255889893, -2.347344398498535, -2.25899600982666, -2.170647382736206, -2.082298755645752, -1.9939502477645874, -1.9056017398834229, -1.8172531127929688, -1.7289046049118042, -1.6405560970306396, -1.5522074699401855, -1.463858962059021, -1.375510334968567, -1.2871618270874023, -1.1988131999969482, -1.1104646921157837, -1.0221161842346191, -0.9337676167488098, -0.8454190492630005, -0.7570705413818359, -0.6687219142913818, -0.5803734064102173, -0.49202483892440796, -0.40367627143859863, -0.31532764434814453, -0.2269790768623352, -0.13863052427768707, -0.05028197169303894, 0.038066595792770386, 0.1264151632785797, 0.21476370096206665, 0.303112268447876, 0.3914608359336853, 0.47980940341949463, 0.568157970905304, 0.6565065383911133, 0.7448550462722778, 0.8332036733627319, 0.9215521812438965, 1.0099008083343506, 1.0982493162155151, 1.1865978240966797, 1.2749464511871338, 1.3632949590682983, 1.4516435861587524, 1.539992094039917, 1.628340721130371, 1.7166892290115356, 1.8050377368927002, 1.8933862447738647, 1.9817348718643188, 2.0700833797454834, 2.1584320068359375, 2.2467806339263916, 2.3351290225982666, 2.4234776496887207, 2.511826276779175]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 7.0, 11.0, 4.0, 11.0, 17.0, 12.0, 22.0, 19.0, 23.0, 22.0, 25.0, 35.0, 36.0, 29.0, 39.0, 35.0, 47.0, 49.0, 60.0, 50.0, 40.0, 46.0, 44.0, 39.0, 38.0, 30.0, 30.0, 30.0, 24.0, 16.0, 19.0, 10.0, 16.0, 8.0, 13.0, 2.0, 4.0, 9.0, 10.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6873423457145691, -0.661778450012207, -0.6362144947052002, -0.6106505990028381, -0.5850867033004761, -0.5595227479934692, -0.5339588522911072, -0.5083949565887451, -0.4828310012817383, -0.45726707577705383, -0.4317031800746918, -0.4061392545700073, -0.3805753290653229, -0.3550114035606384, -0.32944750785827637, -0.3038835823535919, -0.27831968665122986, -0.2527557611465454, -0.22719185054302216, -0.2016279399394989, -0.17606401443481445, -0.1505001038312912, -0.12493619322776794, -0.0993722677230835, -0.07380835711956024, -0.04824443906545639, -0.022680524736642838, 0.0028833895921707153, 0.028447307646274567, 0.05401122570037842, 0.07957513630390167, 0.10513906180858612, 0.13070297241210938, 0.15626688301563263, 0.18183080852031708, 0.20739471912384033, 0.23295864462852478, 0.25852257013320923, 0.2840864658355713, 0.30965039134025574, 0.3352143168449402, 0.36077824234962463, 0.3863421380519867, 0.41190606355667114, 0.4374699890613556, 0.46303391456604004, 0.4885978102684021, 0.5141617059707642, 0.539725661277771, 0.5652895569801331, 0.5908535122871399, 0.616417407989502, 0.641981303691864, 0.6675452589988708, 0.6931091547012329, 0.7186731100082397, 0.744236946105957, 0.7698008418083191, 0.7953647971153259, 0.820928692817688, 0.84649258852005, 0.8720565438270569, 0.897620439529419, 0.9231843948364258, 0.9487482905387878]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 7.0, 15.0, 21.0, 31.0, 45.0, 80.0, 124.0, 252.0, 491.0, 1111.0, 2965.0, 9557.0, 41179.0, 254261.0, 588352.0, 118298.0, 22225.0, 5918.0, 1974.0, 791.0, 375.0, 182.0, 115.0, 64.0, 41.0, 20.0, 15.0, 9.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181884765625, -0.17440032958984375, -0.1669158935546875, -0.15943145751953125, -0.151947021484375, -0.14446258544921875, -0.1369781494140625, -0.12949371337890625, -0.12200927734375, -0.11452484130859375, -0.1070404052734375, -0.09955596923828125, -0.092071533203125, -0.08458709716796875, -0.0771026611328125, -0.06961822509765625, -0.0621337890625, -0.05464935302734375, -0.0471649169921875, -0.03968048095703125, -0.032196044921875, -0.02471160888671875, -0.0172271728515625, -0.00974273681640625, -0.00225830078125, 0.00522613525390625, 0.0127105712890625, 0.02019500732421875, 0.027679443359375, 0.03516387939453125, 0.0426483154296875, 0.05013275146484375, 0.0576171875, 0.06510162353515625, 0.0725860595703125, 0.08007049560546875, 0.087554931640625, 0.09503936767578125, 0.1025238037109375, 0.11000823974609375, 0.11749267578125, 0.12497711181640625, 0.1324615478515625, 0.13994598388671875, 0.147430419921875, 0.15491485595703125, 0.1623992919921875, 0.16988372802734375, 0.1773681640625, 0.18485260009765625, 0.1923370361328125, 0.19982147216796875, 0.207305908203125, 0.21479034423828125, 0.2222747802734375, 0.22975921630859375, 0.23724365234375, 0.24472808837890625, 0.2522125244140625, 0.25969696044921875, 0.267181396484375, 0.27466583251953125, 0.2821502685546875, 0.28963470458984375, 0.297119140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 4.0, 14.0, 12.0, 9.0, 20.0, 21.0, 28.0, 41.0, 41.0, 57.0, 55.0, 59.0, 66.0, 69.0, 62.0, 69.0, 63.0, 59.0, 47.0, 52.0, 34.0, 31.0, 18.0, 25.0, 9.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12762069702148438, -0.12267303466796875, -0.11772537231445312, -0.1127777099609375, -0.10783004760742188, -0.10288238525390625, -0.09793472290039062, -0.092987060546875, -0.08803939819335938, -0.08309173583984375, -0.07814407348632812, -0.0731964111328125, -0.06824874877929688, -0.06330108642578125, -0.058353424072265625, -0.05340576171875, -0.048458099365234375, -0.04351043701171875, -0.038562774658203125, -0.0336151123046875, -0.028667449951171875, -0.02371978759765625, -0.018772125244140625, -0.013824462890625, -0.008876800537109375, -0.00392913818359375, 0.001018524169921875, 0.0059661865234375, 0.010913848876953125, 0.01586151123046875, 0.020809173583984375, 0.0257568359375, 0.030704498291015625, 0.03565216064453125, 0.040599822998046875, 0.0455474853515625, 0.050495147705078125, 0.05544281005859375, 0.060390472412109375, 0.065338134765625, 0.07028579711914062, 0.07523345947265625, 0.08018112182617188, 0.0851287841796875, 0.09007644653320312, 0.09502410888671875, 0.09997177124023438, 0.10491943359375, 0.10986709594726562, 0.11481475830078125, 0.11976242065429688, 0.1247100830078125, 0.12965774536132812, 0.13460540771484375, 0.13955307006835938, 0.144500732421875, 0.14944839477539062, 0.15439605712890625, 0.15934371948242188, 0.1642913818359375, 0.16923904418945312, 0.17418670654296875, 0.17913436889648438, 0.18408203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 4.0, 4.0, 17.0, 14.0, 31.0, 33.0, 50.0, 87.0, 129.0, 203.0, 362.0, 681.0, 1679.0, 5252.0, 27671.0, 307119.0, 654078.0, 40518.0, 6792.0, 1957.0, 854.0, 383.0, 226.0, 132.0, 80.0, 61.0, 30.0, 25.0, 17.0, 20.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28525543212890625, -0.2751007080078125, -0.26494598388671875, -0.254791259765625, -0.24463653564453125, -0.2344818115234375, -0.22432708740234375, -0.21417236328125, -0.20401763916015625, -0.1938629150390625, -0.18370819091796875, -0.173553466796875, -0.16339874267578125, -0.1532440185546875, -0.14308929443359375, -0.1329345703125, -0.12277984619140625, -0.1126251220703125, -0.10247039794921875, -0.092315673828125, -0.08216094970703125, -0.0720062255859375, -0.06185150146484375, -0.05169677734375, -0.04154205322265625, -0.0313873291015625, -0.02123260498046875, -0.011077880859375, -0.00092315673828125, 0.0092315673828125, 0.01938629150390625, 0.029541015625, 0.03969573974609375, 0.0498504638671875, 0.06000518798828125, 0.070159912109375, 0.08031463623046875, 0.0904693603515625, 0.10062408447265625, 0.11077880859375, 0.12093353271484375, 0.1310882568359375, 0.14124298095703125, 0.151397705078125, 0.16155242919921875, 0.1717071533203125, 0.18186187744140625, 0.1920166015625, 0.20217132568359375, 0.2123260498046875, 0.22248077392578125, 0.232635498046875, 0.24279022216796875, 0.2529449462890625, 0.26309967041015625, 0.27325439453125, 0.28340911865234375, 0.2935638427734375, 0.30371856689453125, 0.313873291015625, 0.32402801513671875, 0.3341827392578125, 0.34433746337890625, 0.3544921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 10.0, 20.0, 17.0, 25.0, 25.0, 23.0, 20.0, 39.0, 47.0, 55.0, 50.0, 50.0, 50.0, 49.0, 56.0, 52.0, 33.0, 38.0, 48.0, 45.0, 33.0, 34.0, 31.0, 22.0, 20.0, 16.0, 18.0, 7.0, 6.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.395263671875, -0.38181304931640625, -0.3683624267578125, -0.35491180419921875, -0.341461181640625, -0.32801055908203125, -0.3145599365234375, -0.30110931396484375, -0.28765869140625, -0.27420806884765625, -0.2607574462890625, -0.24730682373046875, -0.233856201171875, -0.22040557861328125, -0.2069549560546875, -0.19350433349609375, -0.1800537109375, -0.16660308837890625, -0.1531524658203125, -0.13970184326171875, -0.126251220703125, -0.11280059814453125, -0.0993499755859375, -0.08589935302734375, -0.07244873046875, -0.05899810791015625, -0.0455474853515625, -0.03209686279296875, -0.018646240234375, -0.00519561767578125, 0.0082550048828125, 0.02170562744140625, 0.03515625, 0.04860687255859375, 0.0620574951171875, 0.07550811767578125, 0.088958740234375, 0.10240936279296875, 0.1158599853515625, 0.12931060791015625, 0.14276123046875, 0.15621185302734375, 0.1696624755859375, 0.18311309814453125, 0.196563720703125, 0.21001434326171875, 0.2234649658203125, 0.23691558837890625, 0.2503662109375, 0.26381683349609375, 0.2772674560546875, 0.29071807861328125, 0.304168701171875, 0.31761932373046875, 0.3310699462890625, 0.34452056884765625, 0.35797119140625, 0.37142181396484375, 0.3848724365234375, 0.39832305908203125, 0.411773681640625, 0.42522430419921875, 0.4386749267578125, 0.45212554931640625, 0.465576171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 8.0, 2.0, 12.0, 11.0, 9.0, 24.0, 35.0, 34.0, 64.0, 119.0, 162.0, 291.0, 515.0, 875.0, 1654.0, 3484.0, 7712.0, 18637.0, 53515.0, 237853.0, 603765.0, 76444.0, 24722.0, 9591.0, 4299.0, 2098.0, 1105.0, 610.0, 331.0, 215.0, 110.0, 72.0, 64.0, 35.0, 22.0, 19.0, 8.0, 9.0, 11.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08758544921875, -0.08502006530761719, -0.08245468139648438, -0.07988929748535156, -0.07732391357421875, -0.07475852966308594, -0.07219314575195312, -0.06962776184082031, -0.0670623779296875, -0.06449699401855469, -0.061931610107421875, -0.05936622619628906, -0.05680084228515625, -0.05423545837402344, -0.051670074462890625, -0.04910469055175781, -0.046539306640625, -0.04397392272949219, -0.041408538818359375, -0.03884315490722656, -0.03627777099609375, -0.03371238708496094, -0.031147003173828125, -0.028581619262695312, -0.0260162353515625, -0.023450851440429688, -0.020885467529296875, -0.018320083618164062, -0.01575469970703125, -0.013189315795898438, -0.010623931884765625, -0.008058547973632812, -0.0054931640625, -0.0029277801513671875, -0.000362396240234375, 0.0022029876708984375, 0.00476837158203125, 0.0073337554931640625, 0.009899139404296875, 0.012464523315429688, 0.0150299072265625, 0.017595291137695312, 0.020160675048828125, 0.022726058959960938, 0.02529144287109375, 0.027856826782226562, 0.030422210693359375, 0.03298759460449219, 0.035552978515625, 0.03811836242675781, 0.040683746337890625, 0.04324913024902344, 0.04581451416015625, 0.04837989807128906, 0.050945281982421875, 0.05351066589355469, 0.0560760498046875, 0.05864143371582031, 0.061206817626953125, 0.06377220153808594, 0.06633758544921875, 0.06890296936035156, 0.07146835327148438, 0.07403373718261719, 0.07659912109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 2.0, 8.0, 10.0, 3.0, 20.0, 17.0, 23.0, 25.0, 40.0, 37.0, 70.0, 106.0, 117.0, 109.0, 85.0, 85.0, 64.0, 44.0, 33.0, 15.0, 20.0, 12.0, 12.0, 11.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8220157623291016e-05, -4.680640995502472e-05, -4.539266228675842e-05, -4.3978914618492126e-05, -4.256516695022583e-05, -4.1151419281959534e-05, -3.973767161369324e-05, -3.832392394542694e-05, -3.6910176277160645e-05, -3.549642860889435e-05, -3.408268094062805e-05, -3.2668933272361755e-05, -3.125518560409546e-05, -2.9841437935829163e-05, -2.8427690267562866e-05, -2.701394259929657e-05, -2.5600194931030273e-05, -2.4186447262763977e-05, -2.277269959449768e-05, -2.1358951926231384e-05, -1.9945204257965088e-05, -1.853145658969879e-05, -1.7117708921432495e-05, -1.57039612531662e-05, -1.4290213584899902e-05, -1.2876465916633606e-05, -1.146271824836731e-05, -1.0048970580101013e-05, -8.635222911834717e-06, -7.22147524356842e-06, -5.807727575302124e-06, -4.393979907035828e-06, -2.9802322387695312e-06, -1.5664845705032349e-06, -1.5273690223693848e-07, 1.261010766029358e-06, 2.6747584342956543e-06, 4.088506102561951e-06, 5.502253770828247e-06, 6.9160014390945435e-06, 8.32974910736084e-06, 9.743496775627136e-06, 1.1157244443893433e-05, 1.2570992112159729e-05, 1.3984739780426025e-05, 1.5398487448692322e-05, 1.6812235116958618e-05, 1.8225982785224915e-05, 1.963973045349121e-05, 2.1053478121757507e-05, 2.2467225790023804e-05, 2.38809734582901e-05, 2.5294721126556396e-05, 2.6708468794822693e-05, 2.812221646308899e-05, 2.9535964131355286e-05, 3.094971179962158e-05, 3.236345946788788e-05, 3.3777207136154175e-05, 3.519095480442047e-05, 3.660470247268677e-05, 3.8018450140953064e-05, 3.943219780921936e-05, 4.084594547748566e-05, 4.225969314575195e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 13.0, 10.0, 10.0, 17.0, 25.0, 46.0, 71.0, 134.0, 250.0, 490.0, 1155.0, 3317.0, 11096.0, 48220.0, 607503.0, 320029.0, 41232.0, 9797.0, 3003.0, 1087.0, 459.0, 241.0, 149.0, 66.0, 48.0, 39.0, 17.0, 9.0, 8.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08441162109375, -0.08056640625, -0.07672119140625, -0.0728759765625, -0.06903076171875, -0.065185546875, -0.06134033203125, -0.0574951171875, -0.05364990234375, -0.0498046875, -0.04595947265625, -0.0421142578125, -0.03826904296875, -0.034423828125, -0.03057861328125, -0.0267333984375, -0.02288818359375, -0.01904296875, -0.01519775390625, -0.0113525390625, -0.00750732421875, -0.003662109375, 0.00018310546875, 0.0040283203125, 0.00787353515625, 0.01171875, 0.01556396484375, 0.0194091796875, 0.02325439453125, 0.027099609375, 0.03094482421875, 0.0347900390625, 0.03863525390625, 0.04248046875, 0.04632568359375, 0.0501708984375, 0.05401611328125, 0.057861328125, 0.06170654296875, 0.0655517578125, 0.06939697265625, 0.0732421875, 0.07708740234375, 0.0809326171875, 0.08477783203125, 0.088623046875, 0.09246826171875, 0.0963134765625, 0.10015869140625, 0.10400390625, 0.10784912109375, 0.1116943359375, 0.11553955078125, 0.119384765625, 0.12322998046875, 0.1270751953125, 0.13092041015625, 0.134765625, 0.13861083984375, 0.1424560546875, 0.14630126953125, 0.150146484375, 0.15399169921875, 0.1578369140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 6.0, 12.0, 8.0, 16.0, 17.0, 22.0, 29.0, 29.0, 36.0, 78.0, 66.0, 107.0, 136.0, 90.0, 85.0, 60.0, 39.0, 26.0, 23.0, 19.0, 12.0, 13.0, 10.0, 11.0, 8.0, 8.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09527587890625, -0.09215068817138672, -0.08902549743652344, -0.08590030670166016, -0.08277511596679688, -0.0796499252319336, -0.07652473449707031, -0.07339954376220703, -0.07027435302734375, -0.06714916229248047, -0.06402397155761719, -0.060898780822753906, -0.057773590087890625, -0.054648399353027344, -0.05152320861816406, -0.04839801788330078, -0.0452728271484375, -0.04214763641357422, -0.03902244567871094, -0.035897254943847656, -0.032772064208984375, -0.029646873474121094, -0.026521682739257812, -0.02339649200439453, -0.02027130126953125, -0.01714611053466797, -0.014020919799804688, -0.010895729064941406, -0.007770538330078125, -0.004645347595214844, -0.0015201568603515625, 0.0016050338745117188, 0.004730224609375, 0.007855415344238281, 0.010980606079101562, 0.014105796813964844, 0.017230987548828125, 0.020356178283691406, 0.023481369018554688, 0.02660655975341797, 0.02973175048828125, 0.03285694122314453, 0.03598213195800781, 0.039107322692871094, 0.042232513427734375, 0.045357704162597656, 0.04848289489746094, 0.05160808563232422, 0.0547332763671875, 0.05785846710205078, 0.06098365783691406, 0.06410884857177734, 0.06723403930664062, 0.0703592300415039, 0.07348442077636719, 0.07660961151123047, 0.07973480224609375, 0.08285999298095703, 0.08598518371582031, 0.0891103744506836, 0.09223556518554688, 0.09536075592041016, 0.09848594665527344, 0.10161113739013672, 0.104736328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 25.0, 33.0, 85.0, 123.0, 246.0, 238.0, 99.0, 49.0, 36.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5853729248046875, -2.5114989280700684, -2.4376251697540283, -2.363751173019409, -2.28987717628479, -2.21600341796875, -2.142129421234131, -2.0682554244995117, -1.9943815469741821, -1.9205076694488525, -1.8466336727142334, -1.7727597951889038, -1.6988859176635742, -1.625011920928955, -1.5511380434036255, -1.477264165878296, -1.4033901691436768, -1.3295162916183472, -1.255642294883728, -1.1817684173583984, -1.1078944206237793, -1.0340205430984497, -0.9601466655731201, -0.8862727284431458, -0.8123987913131714, -0.738524854183197, -0.6646509170532227, -0.5907770395278931, -0.5169031023979187, -0.44302916526794434, -0.36915525794029236, -0.2952813506126404, -0.22140741348266602, -0.14753349125385284, -0.07365956902503967, 0.00021435320377349854, 0.07408827543258667, 0.14796221256256104, 0.221836119890213, 0.295710027217865, 0.36958396434783936, 0.4434579014778137, 0.5173318386077881, 0.5912057161331177, 0.665079653263092, 0.7389535903930664, 0.812827467918396, 0.8867014050483704, 0.9605753421783447, 1.0344492197036743, 1.1083232164382935, 1.182197093963623, 1.2560710906982422, 1.3299449682235718, 1.4038188457489014, 1.4776928424835205, 1.55156672000885, 1.6254405975341797, 1.6993145942687988, 1.7731884717941284, 1.847062349319458, 1.9209363460540771, 1.9948102235794067, 2.0686841011047363, 2.1425580978393555]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 13.0, 7.0, 15.0, 16.0, 24.0, 17.0, 23.0, 33.0, 27.0, 37.0, 26.0, 26.0, 41.0, 64.0, 83.0, 106.0, 85.0, 50.0, 39.0, 32.0, 37.0, 28.0, 26.0, 22.0, 15.0, 17.0, 10.0, 6.0, 9.0, 9.0, 10.0, 13.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6635791063308716, -1.611914038658142, -1.5602489709854126, -1.508583903312683, -1.4569188356399536, -1.4052537679672241, -1.3535887002944946, -1.3019236326217651, -1.2502585649490356, -1.1985934972763062, -1.1469284296035767, -1.0952633619308472, -1.0435982942581177, -0.9919332265853882, -0.9402681589126587, -0.8886030912399292, -0.8369379639625549, -0.7852728962898254, -0.733607828617096, -0.6819427609443665, -0.630277693271637, -0.5786125659942627, -0.5269474983215332, -0.4752824604511261, -0.4236173927783966, -0.3719523251056671, -0.3202872574329376, -0.26862215995788574, -0.21695710718631744, -0.16529202461242676, -0.11362695693969727, -0.06196188926696777, -0.010296821594238281, 0.04136824980378151, 0.0930333212018013, 0.1446983963251114, 0.19636346399784088, 0.24802854657173157, 0.29969361424446106, 0.35135868191719055, 0.40302374958992004, 0.45468881726264954, 0.5063539147377014, 0.5580189824104309, 0.6096840500831604, 0.6613491177558899, 0.7130141854286194, 0.7646792531013489, 0.8163443207740784, 0.8680093884468079, 0.9196744561195374, 0.9713395237922668, 1.0230046510696411, 1.0746697187423706, 1.1263347864151, 1.1779998540878296, 1.229664921760559, 1.2813299894332886, 1.332995057106018, 1.3846601247787476, 1.436325192451477, 1.4879902601242065, 1.539655327796936, 1.5913203954696655, 1.642985463142395]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 11.0, 14.0, 21.0, 49.0, 107.0, 188.0, 383.0, 959.0, 2745.0, 10553.0, 65821.0, 1317007.0, 2630953.0, 143338.0, 15493.0, 4002.0, 1477.0, 595.0, 238.0, 128.0, 70.0, 35.0, 21.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.176513671875, -0.1692047119140625, -0.161895751953125, -0.1545867919921875, -0.14727783203125, -0.1399688720703125, -0.132659912109375, -0.1253509521484375, -0.1180419921875, -0.1107330322265625, -0.103424072265625, -0.0961151123046875, -0.08880615234375, -0.0814971923828125, -0.074188232421875, -0.0668792724609375, -0.0595703125, -0.0522613525390625, -0.044952392578125, -0.0376434326171875, -0.03033447265625, -0.0230255126953125, -0.015716552734375, -0.0084075927734375, -0.0010986328125, 0.0062103271484375, 0.013519287109375, 0.0208282470703125, 0.02813720703125, 0.0354461669921875, 0.042755126953125, 0.0500640869140625, 0.057373046875, 0.0646820068359375, 0.071990966796875, 0.0792999267578125, 0.08660888671875, 0.0939178466796875, 0.101226806640625, 0.1085357666015625, 0.1158447265625, 0.1231536865234375, 0.130462646484375, 0.1377716064453125, 0.14508056640625, 0.1523895263671875, 0.159698486328125, 0.1670074462890625, 0.17431640625, 0.1816253662109375, 0.188934326171875, 0.1962432861328125, 0.20355224609375, 0.2108612060546875, 0.218170166015625, 0.2254791259765625, 0.2327880859375, 0.2400970458984375, 0.247406005859375, 0.2547149658203125, 0.26202392578125, 0.2693328857421875, 0.276641845703125, 0.2839508056640625, 0.291259765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 6.0, 8.0, 5.0, 6.0, 13.0, 14.0, 20.0, 30.0, 46.0, 46.0, 40.0, 67.0, 71.0, 66.0, 72.0, 64.0, 61.0, 67.0, 51.0, 50.0, 46.0, 42.0, 38.0, 22.0, 12.0, 10.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.13480186462402344, -0.12958908081054688, -0.12437629699707031, -0.11916351318359375, -0.11395072937011719, -0.10873794555664062, -0.10352516174316406, -0.0983123779296875, -0.09309959411621094, -0.08788681030273438, -0.08267402648925781, -0.07746124267578125, -0.07224845886230469, -0.06703567504882812, -0.06182289123535156, -0.056610107421875, -0.05139732360839844, -0.046184539794921875, -0.04097175598144531, -0.03575897216796875, -0.030546188354492188, -0.025333404541015625, -0.020120620727539062, -0.0149078369140625, -0.009695053100585938, -0.004482269287109375, 0.0007305145263671875, 0.00594329833984375, 0.011156082153320312, 0.016368865966796875, 0.021581649780273438, 0.02679443359375, 0.03200721740722656, 0.037220001220703125, 0.04243278503417969, 0.04764556884765625, 0.05285835266113281, 0.058071136474609375, 0.06328392028808594, 0.0684967041015625, 0.07370948791503906, 0.07892227172851562, 0.08413505554199219, 0.08934783935546875, 0.09456062316894531, 0.09977340698242188, 0.10498619079589844, 0.110198974609375, 0.11541175842285156, 0.12062454223632812, 0.1258373260498047, 0.13105010986328125, 0.1362628936767578, 0.14147567749023438, 0.14668846130371094, 0.1519012451171875, 0.15711402893066406, 0.16232681274414062, 0.1675395965576172, 0.17275238037109375, 0.1779651641845703, 0.18317794799804688, 0.18839073181152344, 0.193603515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 15.0, 17.0, 32.0, 56.0, 122.0, 238.0, 564.0, 1816.0, 9665.0, 198325.0, 3904288.0, 71395.0, 5576.0, 1256.0, 434.0, 224.0, 96.0, 51.0, 40.0, 19.0, 8.0, 12.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4228515625, -0.4084587097167969, -0.39406585693359375, -0.3796730041503906, -0.3652801513671875, -0.3508872985839844, -0.33649444580078125, -0.3221015930175781, -0.307708740234375, -0.2933158874511719, -0.27892303466796875, -0.2645301818847656, -0.2501373291015625, -0.23574447631835938, -0.22135162353515625, -0.20695877075195312, -0.19256591796875, -0.17817306518554688, -0.16378021240234375, -0.14938735961914062, -0.1349945068359375, -0.12060165405273438, -0.10620880126953125, -0.09181594848632812, -0.077423095703125, -0.06303024291992188, -0.04863739013671875, -0.034244537353515625, -0.0198516845703125, -0.005458831787109375, 0.00893402099609375, 0.023326873779296875, 0.0377197265625, 0.052112579345703125, 0.06650543212890625, 0.08089828491210938, 0.0952911376953125, 0.10968399047851562, 0.12407684326171875, 0.13846969604492188, 0.152862548828125, 0.16725540161132812, 0.18164825439453125, 0.19604110717773438, 0.2104339599609375, 0.22482681274414062, 0.23921966552734375, 0.2536125183105469, 0.26800537109375, 0.2823982238769531, 0.29679107666015625, 0.3111839294433594, 0.3255767822265625, 0.3399696350097656, 0.35436248779296875, 0.3687553405761719, 0.383148193359375, 0.3975410461425781, 0.41193389892578125, 0.4263267517089844, 0.4407196044921875, 0.4551124572753906, 0.46950531005859375, 0.4838981628417969, 0.498291015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 9.0, 21.0, 18.0, 21.0, 37.0, 50.0, 94.0, 99.0, 182.0, 312.0, 423.0, 602.0, 658.0, 509.0, 361.0, 215.0, 145.0, 95.0, 56.0, 42.0, 29.0, 20.0, 15.0, 13.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18215370178222656, -0.17522048950195312, -0.1682872772216797, -0.16135406494140625, -0.1544208526611328, -0.14748764038085938, -0.14055442810058594, -0.1336212158203125, -0.12668800354003906, -0.11975479125976562, -0.11282157897949219, -0.10588836669921875, -0.09895515441894531, -0.09202194213867188, -0.08508872985839844, -0.078155517578125, -0.07122230529785156, -0.06428909301757812, -0.05735588073730469, -0.05042266845703125, -0.04348945617675781, -0.036556243896484375, -0.029623031616210938, -0.0226898193359375, -0.015756607055664062, -0.008823394775390625, -0.0018901824951171875, 0.00504302978515625, 0.011976242065429688, 0.018909454345703125, 0.025842666625976562, 0.03277587890625, 0.03970909118652344, 0.046642303466796875, 0.05357551574707031, 0.06050872802734375, 0.06744194030761719, 0.07437515258789062, 0.08130836486816406, 0.0882415771484375, 0.09517478942871094, 0.10210800170898438, 0.10904121398925781, 0.11597442626953125, 0.12290763854980469, 0.12984085083007812, 0.13677406311035156, 0.143707275390625, 0.15064048767089844, 0.15757369995117188, 0.1645069122314453, 0.17144012451171875, 0.1783733367919922, 0.18530654907226562, 0.19223976135253906, 0.1991729736328125, 0.20610618591308594, 0.21303939819335938, 0.2199726104736328, 0.22690582275390625, 0.2338390350341797, 0.24077224731445312, 0.24770545959472656, 0.254638671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 28.0, 48.0, 122.0, 211.0, 243.0, 178.0, 84.0, 43.0, 16.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.689993381500244, -4.591251850128174, -4.492509841918945, -4.393768310546875, -4.2950263023376465, -4.196284770965576, -4.097542762756348, -3.9988012313842773, -3.900059700012207, -3.8013179302215576, -3.702576160430908, -3.603834629058838, -3.5050928592681885, -3.406351089477539, -3.3076093196868896, -3.2088675498962402, -3.110125780105591, -3.0113840103149414, -2.912642240524292, -2.8139004707336426, -2.7151589393615723, -2.616417169570923, -2.5176753997802734, -2.418933629989624, -2.3201918601989746, -2.221450090408325, -2.122708320617676, -2.0239667892456055, -1.925225019454956, -1.8264832496643066, -1.7277414798736572, -1.6289997100830078, -1.5302579402923584, -1.431516170501709, -1.3327745199203491, -1.2340327501296997, -1.1352910995483398, -1.0365493297576904, -0.937807559967041, -0.8390658497810364, -0.7403241395950317, -0.6415824294090271, -0.5428407192230225, -0.44409894943237305, -0.3453572392463684, -0.24661552906036377, -0.14787375926971436, -0.04913204908370972, 0.04960966110229492, 0.14835138618946075, 0.2470931112766266, 0.3458348512649536, 0.44457656145095825, 0.5433182716369629, 0.6420600414276123, 0.7408017516136169, 0.8395434617996216, 0.9382851719856262, 1.0370268821716309, 1.1357686519622803, 1.2345104217529297, 1.3332520723342896, 1.431993842124939, 1.5307354927062988, 1.6294772624969482]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 13.0, 17.0, 10.0, 20.0, 18.0, 20.0, 22.0, 18.0, 36.0, 36.0, 46.0, 50.0, 47.0, 47.0, 55.0, 52.0, 51.0, 65.0, 48.0, 50.0, 34.0, 26.0, 39.0, 33.0, 23.0, 25.0, 19.0, 15.0, 14.0, 8.0, 9.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728849172592163, -1.0371637344360352, -1.001442551612854, -0.9657214283943176, -0.9300003051757812, -0.8942791223526001, -0.858557939529419, -0.8228368163108826, -0.7871156930923462, -0.751394510269165, -0.7156733870506287, -0.6799522042274475, -0.6442310810089111, -0.60850989818573, -0.5727887153625488, -0.5370675921440125, -0.5013464093208313, -0.46562525629997253, -0.42990410327911377, -0.3941829204559326, -0.35846179723739624, -0.3227406144142151, -0.2870194613933563, -0.25129830837249756, -0.2155771553516388, -0.17985600233078003, -0.14413484930992126, -0.1084136813879013, -0.07269252836704254, -0.03697137534618378, -0.0012502074241638184, 0.034470945596694946, 0.07019209861755371, 0.10591325163841248, 0.14163440465927124, 0.1773555725812912, 0.21307672560214996, 0.24879787862300873, 0.2845190465450287, 0.32024019956588745, 0.3559613525867462, 0.391682505607605, 0.42740365862846375, 0.4631248116493225, 0.49884599447250366, 0.53456711769104, 0.5702883005142212, 0.6060094833374023, 0.6417306065559387, 0.6774517893791199, 0.7131729125976562, 0.7488940954208374, 0.7846152186393738, 0.8203364014625549, 0.8560575246810913, 0.8917787075042725, 0.9274998903274536, 0.9632210731506348, 0.9989421963691711, 1.0346633195877075, 1.0703845024108887, 1.1061056852340698, 1.141826868057251, 1.1775479316711426, 1.2132691144943237]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 11.0, 23.0, 24.0, 31.0, 41.0, 108.0, 138.0, 285.0, 597.0, 1109.0, 2907.0, 7747.0, 24772.0, 93797.0, 406248.0, 386518.0, 88075.0, 23259.0, 7563.0, 2822.0, 1235.0, 559.0, 285.0, 125.0, 88.0, 56.0, 28.0, 31.0, 16.0, 11.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.212890625, -0.2068042755126953, -0.20071792602539062, -0.19463157653808594, -0.18854522705078125, -0.18245887756347656, -0.17637252807617188, -0.1702861785888672, -0.1641998291015625, -0.1581134796142578, -0.15202713012695312, -0.14594078063964844, -0.13985443115234375, -0.13376808166503906, -0.12768173217773438, -0.12159538269042969, -0.115509033203125, -0.10942268371582031, -0.10333633422851562, -0.09724998474121094, -0.09116363525390625, -0.08507728576660156, -0.07899093627929688, -0.07290458679199219, -0.0668182373046875, -0.06073188781738281, -0.054645538330078125, -0.04855918884277344, -0.04247283935546875, -0.03638648986816406, -0.030300140380859375, -0.024213790893554688, -0.01812744140625, -0.012041091918945312, -0.005954742431640625, 0.0001316070556640625, 0.00621795654296875, 0.012304306030273438, 0.018390655517578125, 0.024477005004882812, 0.0305633544921875, 0.03664970397949219, 0.042736053466796875, 0.04882240295410156, 0.05490875244140625, 0.06099510192871094, 0.06708145141601562, 0.07316780090332031, 0.079254150390625, 0.08534049987792969, 0.09142684936523438, 0.09751319885253906, 0.10359954833984375, 0.10968589782714844, 0.11577224731445312, 0.12185859680175781, 0.1279449462890625, 0.1340312957763672, 0.14011764526367188, 0.14620399475097656, 0.15229034423828125, 0.15837669372558594, 0.16446304321289062, 0.1705493927001953, 0.1766357421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 9.0, 19.0, 18.0, 27.0, 39.0, 46.0, 50.0, 55.0, 62.0, 64.0, 57.0, 72.0, 69.0, 56.0, 46.0, 60.0, 46.0, 33.0, 28.0, 27.0, 24.0, 23.0, 15.0, 11.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.1368236541748047, -0.13167953491210938, -0.12653541564941406, -0.12139129638671875, -0.11624717712402344, -0.11110305786132812, -0.10595893859863281, -0.1008148193359375, -0.09567070007324219, -0.09052658081054688, -0.08538246154785156, -0.08023834228515625, -0.07509422302246094, -0.06995010375976562, -0.06480598449707031, -0.059661865234375, -0.05451774597167969, -0.049373626708984375, -0.04422950744628906, -0.03908538818359375, -0.03394126892089844, -0.028797149658203125, -0.023653030395507812, -0.0185089111328125, -0.013364791870117188, -0.008220672607421875, -0.0030765533447265625, 0.00206756591796875, 0.0072116851806640625, 0.012355804443359375, 0.017499923706054688, 0.02264404296875, 0.027788162231445312, 0.032932281494140625, 0.03807640075683594, 0.04322052001953125, 0.04836463928222656, 0.053508758544921875, 0.05865287780761719, 0.0637969970703125, 0.06894111633300781, 0.07408523559570312, 0.07922935485839844, 0.08437347412109375, 0.08951759338378906, 0.09466171264648438, 0.09980583190917969, 0.104949951171875, 0.11009407043457031, 0.11523818969726562, 0.12038230895996094, 0.12552642822265625, 0.13067054748535156, 0.13581466674804688, 0.1409587860107422, 0.1461029052734375, 0.1512470245361328, 0.15639114379882812, 0.16153526306152344, 0.16667938232421875, 0.17182350158691406, 0.17696762084960938, 0.1821117401123047, 0.187255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 4.0, 12.0, 17.0, 19.0, 21.0, 36.0, 52.0, 69.0, 92.0, 190.0, 318.0, 518.0, 1200.0, 3530.0, 20933.0, 435219.0, 558414.0, 21711.0, 3589.0, 1207.0, 583.0, 325.0, 165.0, 95.0, 77.0, 63.0, 30.0, 17.0, 9.0, 3.0, 8.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4365234375, -0.4236869812011719, -0.41085052490234375, -0.3980140686035156, -0.3851776123046875, -0.3723411560058594, -0.35950469970703125, -0.3466682434082031, -0.333831787109375, -0.3209953308105469, -0.30815887451171875, -0.2953224182128906, -0.2824859619140625, -0.2696495056152344, -0.25681304931640625, -0.24397659301757812, -0.23114013671875, -0.21830368041992188, -0.20546722412109375, -0.19263076782226562, -0.1797943115234375, -0.16695785522460938, -0.15412139892578125, -0.14128494262695312, -0.128448486328125, -0.11561203002929688, -0.10277557373046875, -0.08993911743164062, -0.0771026611328125, -0.06426620483398438, -0.05142974853515625, -0.038593292236328125, -0.0257568359375, -0.012920379638671875, -8.392333984375e-05, 0.012752532958984375, 0.0255889892578125, 0.038425445556640625, 0.05126190185546875, 0.06409835815429688, 0.076934814453125, 0.08977127075195312, 0.10260772705078125, 0.11544418334960938, 0.1282806396484375, 0.14111709594726562, 0.15395355224609375, 0.16679000854492188, 0.17962646484375, 0.19246292114257812, 0.20529937744140625, 0.21813583374023438, 0.2309722900390625, 0.24380874633789062, 0.25664520263671875, 0.2694816589355469, 0.282318115234375, 0.2951545715332031, 0.30799102783203125, 0.3208274841308594, 0.3336639404296875, 0.3465003967285156, 0.35933685302734375, 0.3721733093261719, 0.385009765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 6.0, 5.0, 13.0, 9.0, 13.0, 34.0, 29.0, 37.0, 38.0, 37.0, 64.0, 63.0, 59.0, 74.0, 78.0, 65.0, 61.0, 50.0, 45.0, 41.0, 41.0, 28.0, 23.0, 26.0, 10.0, 12.0, 7.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.6506729125976562, -0.6309356689453125, -0.6111984252929688, -0.591461181640625, -0.5717239379882812, -0.5519866943359375, -0.5322494506835938, -0.51251220703125, -0.49277496337890625, -0.4730377197265625, -0.45330047607421875, -0.433563232421875, -0.41382598876953125, -0.3940887451171875, -0.37435150146484375, -0.3546142578125, -0.33487701416015625, -0.3151397705078125, -0.29540252685546875, -0.275665283203125, -0.25592803955078125, -0.2361907958984375, -0.21645355224609375, -0.19671630859375, -0.17697906494140625, -0.1572418212890625, -0.13750457763671875, -0.117767333984375, -0.09803009033203125, -0.0782928466796875, -0.05855560302734375, -0.038818359375, -0.01908111572265625, 0.0006561279296875, 0.02039337158203125, 0.040130615234375, 0.05986785888671875, 0.0796051025390625, 0.09934234619140625, 0.11907958984375, 0.13881683349609375, 0.1585540771484375, 0.17829132080078125, 0.198028564453125, 0.21776580810546875, 0.2375030517578125, 0.25724029541015625, 0.2769775390625, 0.29671478271484375, 0.3164520263671875, 0.33618927001953125, 0.355926513671875, 0.37566375732421875, 0.3954010009765625, 0.41513824462890625, 0.43487548828125, 0.45461273193359375, 0.4743499755859375, 0.49408721923828125, 0.513824462890625, 0.5335617065429688, 0.5532989501953125, 0.5730361938476562, 0.5927734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 10.0, 8.0, 17.0, 20.0, 22.0, 38.0, 76.0, 109.0, 181.0, 318.0, 602.0, 1454.0, 3683.0, 11631.0, 50855.0, 757821.0, 183913.0, 26238.0, 7046.0, 2404.0, 948.0, 511.0, 249.0, 130.0, 79.0, 47.0, 37.0, 21.0, 22.0, 18.0, 7.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.10995674133300781, -0.10626602172851562, -0.10257530212402344, -0.09888458251953125, -0.09519386291503906, -0.09150314331054688, -0.08781242370605469, -0.0841217041015625, -0.08043098449707031, -0.07674026489257812, -0.07304954528808594, -0.06935882568359375, -0.06566810607910156, -0.061977386474609375, -0.05828666687011719, -0.054595947265625, -0.05090522766113281, -0.047214508056640625, -0.04352378845214844, -0.03983306884765625, -0.03614234924316406, -0.032451629638671875, -0.028760910034179688, -0.0250701904296875, -0.021379470825195312, -0.017688751220703125, -0.013998031616210938, -0.01030731201171875, -0.0066165924072265625, -0.002925872802734375, 0.0007648468017578125, 0.00445556640625, 0.008146286010742188, 0.011837005615234375, 0.015527725219726562, 0.01921844482421875, 0.022909164428710938, 0.026599884033203125, 0.030290603637695312, 0.0339813232421875, 0.03767204284667969, 0.041362762451171875, 0.04505348205566406, 0.04874420166015625, 0.05243492126464844, 0.056125640869140625, 0.05981636047363281, 0.063507080078125, 0.06719779968261719, 0.07088851928710938, 0.07457923889160156, 0.07826995849609375, 0.08196067810058594, 0.08565139770507812, 0.08934211730957031, 0.0930328369140625, 0.09672355651855469, 0.10041427612304688, 0.10410499572753906, 0.10779571533203125, 0.11148643493652344, 0.11517715454101562, 0.11886787414550781, 0.12255859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 4.0, 5.0, 6.0, 10.0, 20.0, 11.0, 17.0, 17.0, 37.0, 43.0, 64.0, 58.0, 80.0, 68.0, 78.0, 82.0, 75.0, 54.0, 51.0, 48.0, 27.0, 30.0, 20.0, 20.0, 10.0, 5.0, 5.0, 8.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8789043426513672e-05, -2.7704983949661255e-05, -2.6620924472808838e-05, -2.553686499595642e-05, -2.4452805519104004e-05, -2.3368746042251587e-05, -2.228468656539917e-05, -2.1200627088546753e-05, -2.0116567611694336e-05, -1.903250813484192e-05, -1.7948448657989502e-05, -1.6864389181137085e-05, -1.5780329704284668e-05, -1.4696270227432251e-05, -1.3612210750579834e-05, -1.2528151273727417e-05, -1.1444091796875e-05, -1.0360032320022583e-05, -9.275972843170166e-06, -8.191913366317749e-06, -7.107853889465332e-06, -6.023794412612915e-06, -4.939734935760498e-06, -3.855675458908081e-06, -2.771615982055664e-06, -1.687556505203247e-06, -6.034970283508301e-07, 4.805624485015869e-07, 1.564621925354004e-06, 2.648681402206421e-06, 3.732740879058838e-06, 4.816800355911255e-06, 5.900859832763672e-06, 6.984919309616089e-06, 8.068978786468506e-06, 9.153038263320923e-06, 1.023709774017334e-05, 1.1321157217025757e-05, 1.2405216693878174e-05, 1.348927617073059e-05, 1.4573335647583008e-05, 1.5657395124435425e-05, 1.6741454601287842e-05, 1.782551407814026e-05, 1.8909573554992676e-05, 1.9993633031845093e-05, 2.107769250869751e-05, 2.2161751985549927e-05, 2.3245811462402344e-05, 2.432987093925476e-05, 2.5413930416107178e-05, 2.6497989892959595e-05, 2.7582049369812012e-05, 2.866610884666443e-05, 2.9750168323516846e-05, 3.083422780036926e-05, 3.191828727722168e-05, 3.30023467540741e-05, 3.4086406230926514e-05, 3.517046570777893e-05, 3.625452518463135e-05, 3.7338584661483765e-05, 3.842264413833618e-05, 3.95067036151886e-05, 4.0590763092041016e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 5.0, 11.0, 14.0, 13.0, 15.0, 27.0, 54.0, 64.0, 129.0, 256.0, 489.0, 1246.0, 3837.0, 16357.0, 123464.0, 826996.0, 60678.0, 10548.0, 2571.0, 891.0, 396.0, 201.0, 112.0, 64.0, 35.0, 24.0, 19.0, 13.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138427734375, -0.13401222229003906, -0.12959671020507812, -0.1251811981201172, -0.12076568603515625, -0.11635017395019531, -0.11193466186523438, -0.10751914978027344, -0.1031036376953125, -0.09868812561035156, -0.09427261352539062, -0.08985710144042969, -0.08544158935546875, -0.08102607727050781, -0.07661056518554688, -0.07219505310058594, -0.067779541015625, -0.06336402893066406, -0.058948516845703125, -0.05453300476074219, -0.05011749267578125, -0.04570198059082031, -0.041286468505859375, -0.03687095642089844, -0.0324554443359375, -0.028039932250976562, -0.023624420166015625, -0.019208908081054688, -0.01479339599609375, -0.010377883911132812, -0.005962371826171875, -0.0015468597412109375, 0.00286865234375, 0.0072841644287109375, 0.011699676513671875, 0.016115188598632812, 0.02053070068359375, 0.024946212768554688, 0.029361724853515625, 0.03377723693847656, 0.0381927490234375, 0.04260826110839844, 0.047023773193359375, 0.05143928527832031, 0.05585479736328125, 0.06027030944824219, 0.06468582153320312, 0.06910133361816406, 0.073516845703125, 0.07793235778808594, 0.08234786987304688, 0.08676338195800781, 0.09117889404296875, 0.09559440612792969, 0.10000991821289062, 0.10442543029785156, 0.1088409423828125, 0.11325645446777344, 0.11767196655273438, 0.12208747863769531, 0.12650299072265625, 0.1309185028076172, 0.13533401489257812, 0.13974952697753906, 0.1441650390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 6.0, 4.0, 16.0, 16.0, 20.0, 33.0, 30.0, 57.0, 89.0, 95.0, 161.0, 134.0, 99.0, 64.0, 42.0, 23.0, 20.0, 25.0, 8.0, 10.0, 8.0, 8.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.123046875, -0.1194000244140625, -0.115753173828125, -0.1121063232421875, -0.10845947265625, -0.1048126220703125, -0.101165771484375, -0.0975189208984375, -0.0938720703125, -0.0902252197265625, -0.086578369140625, -0.0829315185546875, -0.07928466796875, -0.0756378173828125, -0.071990966796875, -0.0683441162109375, -0.064697265625, -0.0610504150390625, -0.057403564453125, -0.0537567138671875, -0.05010986328125, -0.0464630126953125, -0.042816162109375, -0.0391693115234375, -0.0355224609375, -0.0318756103515625, -0.028228759765625, -0.0245819091796875, -0.02093505859375, -0.0172882080078125, -0.013641357421875, -0.0099945068359375, -0.00634765625, -0.0027008056640625, 0.000946044921875, 0.0045928955078125, 0.00823974609375, 0.0118865966796875, 0.015533447265625, 0.0191802978515625, 0.0228271484375, 0.0264739990234375, 0.030120849609375, 0.0337677001953125, 0.03741455078125, 0.0410614013671875, 0.044708251953125, 0.0483551025390625, 0.052001953125, 0.0556488037109375, 0.059295654296875, 0.0629425048828125, 0.06658935546875, 0.0702362060546875, 0.073883056640625, 0.0775299072265625, 0.0811767578125, 0.0848236083984375, 0.088470458984375, 0.0921173095703125, 0.09576416015625, 0.0994110107421875, 0.103057861328125, 0.1067047119140625, 0.1103515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 39.0, 138.0, 534.0, 191.0, 54.0, 15.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.045783996582031, -5.881122589111328, -5.716460704803467, -5.551799297332764, -5.3871378898620605, -5.222476005554199, -5.057814598083496, -4.893153190612793, -4.72849178314209, -4.563830375671387, -4.399168491363525, -4.234507083892822, -4.069845676422119, -3.905184030532837, -3.7405223846435547, -3.5758609771728516, -3.4111990928649902, -3.246537446975708, -3.081876039505005, -2.9172143936157227, -2.7525529861450195, -2.5878913402557373, -2.423229694366455, -2.258568286895752, -2.0939066410064697, -1.929245114326477, -1.7645835876464844, -1.5999219417572021, -1.4352604150772095, -1.2705988883972168, -1.1059372425079346, -0.9412757158279419, -0.776613712310791, -0.6119521856307983, -0.4472905993461609, -0.2826290428638458, -0.11796748638153076, 0.046694040298461914, 0.21135562658309937, 0.3760172128677368, 0.5406787395477295, 0.7053402662277222, 0.8700018525123596, 1.034663438796997, 1.1993249654769897, 1.3639864921569824, 1.5286481380462646, 1.6933096647262573, 1.85797119140625, 2.0226328372955322, 2.1872942447662354, 2.3519558906555176, 2.5166172981262207, 2.681278944015503, 2.845940589904785, 3.0106019973754883, 3.1752636432647705, 3.3399252891540527, 3.504586696624756, 3.669248342514038, 3.8339099884033203, 3.9985713958740234, 4.163232803344727, 4.327894687652588, 4.492556095123291]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 6.0, 9.0, 5.0, 11.0, 10.0, 23.0, 15.0, 19.0, 19.0, 15.0, 26.0, 22.0, 24.0, 37.0, 47.0, 80.0, 156.0, 122.0, 63.0, 32.0, 29.0, 25.0, 37.0, 20.0, 13.0, 19.0, 16.0, 21.0, 15.0, 19.0, 10.0, 3.0, 4.0, 7.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.999355435371399, -1.9382165670394897, -1.8770778179168701, -1.815938949584961, -1.7548000812530518, -1.6936612129211426, -1.632522463798523, -1.5713835954666138, -1.5102448463439941, -1.449105978012085, -1.3879672288894653, -1.3268283605575562, -1.265689492225647, -1.2045507431030273, -1.1434118747711182, -1.082273006439209, -1.0211341381072998, -0.9599953293800354, -0.8988564610481262, -0.8377176523208618, -0.7765787839889526, -0.7154399752616882, -0.6543011665344238, -0.5931622982025146, -0.5320234894752502, -0.47088465094566345, -0.40974581241607666, -0.34860700368881226, -0.28746816515922546, -0.22632932662963867, -0.16519051790237427, -0.10405167937278748, -0.042912960052490234, 0.01822587102651596, 0.07936470210552216, 0.14050352573394775, 0.20164236426353455, 0.26278120279312134, 0.32392001152038574, 0.38505885004997253, 0.4461976885795593, 0.5073364973068237, 0.5684753656387329, 0.6296141743659973, 0.6907529830932617, 0.7518918514251709, 0.8130306601524353, 0.8741694688796997, 0.9353083372116089, 0.9964471459388733, 1.0575859546661377, 1.1187248229980469, 1.179863691329956, 1.2410025596618652, 1.3021413087844849, 1.363280177116394, 1.4244189262390137, 1.4855577945709229, 1.5466965436935425, 1.6078354120254517, 1.6689742803573608, 1.7301130294799805, 1.7912518978118896, 1.8523907661437988, 1.913529634475708]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 8.0, 6.0, 15.0, 20.0, 27.0, 57.0, 119.0, 242.0, 489.0, 1202.0, 3312.0, 11317.0, 68823.0, 953711.0, 2773752.0, 341210.0, 30017.0, 6442.0, 2046.0, 795.0, 342.0, 133.0, 81.0, 38.0, 23.0, 17.0, 9.0, 6.0, 3.0, 1.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.306396484375, -0.29628753662109375, -0.2861785888671875, -0.27606964111328125, -0.265960693359375, -0.25585174560546875, -0.2457427978515625, -0.23563385009765625, -0.22552490234375, -0.21541595458984375, -0.2053070068359375, -0.19519805908203125, -0.185089111328125, -0.17498016357421875, -0.1648712158203125, -0.15476226806640625, -0.1446533203125, -0.13454437255859375, -0.1244354248046875, -0.11432647705078125, -0.104217529296875, -0.09410858154296875, -0.0839996337890625, -0.07389068603515625, -0.06378173828125, -0.05367279052734375, -0.0435638427734375, -0.03345489501953125, -0.023345947265625, -0.01323699951171875, -0.0031280517578125, 0.00698089599609375, 0.01708984375, 0.02719879150390625, 0.0373077392578125, 0.04741668701171875, 0.057525634765625, 0.06763458251953125, 0.0777435302734375, 0.08785247802734375, 0.09796142578125, 0.10807037353515625, 0.1181793212890625, 0.12828826904296875, 0.138397216796875, 0.14850616455078125, 0.1586151123046875, 0.16872406005859375, 0.1788330078125, 0.18894195556640625, 0.1990509033203125, 0.20915985107421875, 0.219268798828125, 0.22937774658203125, 0.2394866943359375, 0.24959564208984375, 0.25970458984375, 0.26981353759765625, 0.2799224853515625, 0.29003143310546875, 0.300140380859375, 0.31024932861328125, 0.3203582763671875, 0.33046722412109375, 0.340576171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 11.0, 10.0, 17.0, 37.0, 38.0, 46.0, 47.0, 46.0, 50.0, 55.0, 61.0, 74.0, 65.0, 54.0, 52.0, 49.0, 51.0, 49.0, 22.0, 37.0, 23.0, 19.0, 16.0, 11.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.12982749938964844, -0.12501144409179688, -0.12019538879394531, -0.11537933349609375, -0.11056327819824219, -0.10574722290039062, -0.10093116760253906, -0.0961151123046875, -0.09129905700683594, -0.08648300170898438, -0.08166694641113281, -0.07685089111328125, -0.07203483581542969, -0.06721878051757812, -0.06240272521972656, -0.057586669921875, -0.05277061462402344, -0.047954559326171875, -0.04313850402832031, -0.03832244873046875, -0.03350639343261719, -0.028690338134765625, -0.023874282836914062, -0.0190582275390625, -0.014242172241210938, -0.009426116943359375, -0.0046100616455078125, 0.00020599365234375, 0.0050220489501953125, 0.009838104248046875, 0.014654159545898438, 0.01947021484375, 0.024286270141601562, 0.029102325439453125, 0.03391838073730469, 0.03873443603515625, 0.04355049133300781, 0.048366546630859375, 0.05318260192871094, 0.0579986572265625, 0.06281471252441406, 0.06763076782226562, 0.07244682312011719, 0.07726287841796875, 0.08207893371582031, 0.08689498901367188, 0.09171104431152344, 0.096527099609375, 0.10134315490722656, 0.10615921020507812, 0.11097526550292969, 0.11579132080078125, 0.12060737609863281, 0.12542343139648438, 0.13023948669433594, 0.1350555419921875, 0.13987159729003906, 0.14468765258789062, 0.1495037078857422, 0.15431976318359375, 0.1591358184814453, 0.16395187377929688, 0.16876792907714844, 0.173583984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 25.0, 39.0, 103.0, 307.0, 866.0, 3695.0, 1578189.0, 2605820.0, 3889.0, 865.0, 262.0, 92.0, 46.0, 21.0, 10.0, 7.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8935546875, -1.8361968994140625, -1.778839111328125, -1.7214813232421875, -1.66412353515625, -1.6067657470703125, -1.549407958984375, -1.4920501708984375, -1.4346923828125, -1.3773345947265625, -1.319976806640625, -1.2626190185546875, -1.20526123046875, -1.1479034423828125, -1.090545654296875, -1.0331878662109375, -0.975830078125, -0.9184722900390625, -0.861114501953125, -0.8037567138671875, -0.74639892578125, -0.6890411376953125, -0.631683349609375, -0.5743255615234375, -0.5169677734375, -0.4596099853515625, -0.402252197265625, -0.3448944091796875, -0.28753662109375, -0.2301788330078125, -0.172821044921875, -0.1154632568359375, -0.05810546875, -0.0007476806640625, 0.056610107421875, 0.1139678955078125, 0.17132568359375, 0.2286834716796875, 0.286041259765625, 0.3433990478515625, 0.4007568359375, 0.4581146240234375, 0.515472412109375, 0.5728302001953125, 0.63018798828125, 0.6875457763671875, 0.744903564453125, 0.8022613525390625, 0.859619140625, 0.9169769287109375, 0.974334716796875, 1.0316925048828125, 1.08905029296875, 1.1464080810546875, 1.203765869140625, 1.2611236572265625, 1.3184814453125, 1.3758392333984375, 1.433197021484375, 1.4905548095703125, 1.54791259765625, 1.6052703857421875, 1.662628173828125, 1.7199859619140625, 1.77734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 15.0, 43.0, 102.0, 310.0, 838.0, 1516.0, 736.0, 309.0, 118.0, 48.0, 14.0, 14.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.054962158203125, -1.01910400390625, -0.983245849609375, -0.9473876953125, -0.911529541015625, -0.87567138671875, -0.839813232421875, -0.803955078125, -0.768096923828125, -0.73223876953125, -0.696380615234375, -0.6605224609375, -0.624664306640625, -0.58880615234375, -0.552947998046875, -0.51708984375, -0.481231689453125, -0.44537353515625, -0.409515380859375, -0.3736572265625, -0.337799072265625, -0.30194091796875, -0.266082763671875, -0.230224609375, -0.194366455078125, -0.15850830078125, -0.122650146484375, -0.0867919921875, -0.050933837890625, -0.01507568359375, 0.020782470703125, 0.056640625, 0.092498779296875, 0.12835693359375, 0.164215087890625, 0.2000732421875, 0.235931396484375, 0.27178955078125, 0.307647705078125, 0.343505859375, 0.379364013671875, 0.41522216796875, 0.451080322265625, 0.4869384765625, 0.522796630859375, 0.55865478515625, 0.594512939453125, 0.63037109375, 0.666229248046875, 0.70208740234375, 0.737945556640625, 0.7738037109375, 0.809661865234375, 0.84552001953125, 0.881378173828125, 0.917236328125, 0.953094482421875, 0.98895263671875, 1.024810791015625, 1.0606689453125, 1.096527099609375, 1.13238525390625, 1.168243408203125, 1.2041015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 21.0, 60.0, 173.0, 293.0, 242.0, 102.0, 35.0, 18.0, 10.0, 2.0, 9.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.934843063354492, -11.661642074584961, -11.388440132141113, -11.115239143371582, -10.84203815460205, -10.56883716583252, -10.295635223388672, -10.02243423461914, -9.74923324584961, -9.476032257080078, -9.20283031463623, -8.9296293258667, -8.656428337097168, -8.383227348327637, -8.110025405883789, -7.836824417114258, -7.563622951507568, -7.290421485900879, -7.017220497131348, -6.744019031524658, -6.470818042755127, -6.1976165771484375, -5.924415588378906, -5.651214122772217, -5.378012657165527, -5.104811191558838, -4.831610202789307, -4.558408737182617, -4.285207748413086, -4.0120062828063965, -3.738805055618286, -3.465603828430176, -3.1924033164978027, -2.9192020893096924, -2.646000862121582, -2.3727993965148926, -2.0995984077453613, -1.8263970613479614, -1.5531957149505615, -1.2799944877624512, -1.0067932605743408, -0.7335920333862305, -0.46039074659347534, -0.18718945980072021, 0.08601176738739014, 0.3592129945755005, 0.6324143409729004, 0.9056155681610107, 1.178816795349121, 1.4520180225372314, 1.7252192497253418, 1.9984205961227417, 2.2716217041015625, 2.544823169708252, 2.8180243968963623, 3.0912256240844727, 3.364426851272583, 3.6376280784606934, 3.9108293056488037, 4.184030532836914, 4.4572319984436035, 4.730432987213135, 5.003634452819824, 5.2768354415893555, 5.550036907196045]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 10.0, 9.0, 19.0, 32.0, 34.0, 46.0, 50.0, 51.0, 75.0, 77.0, 81.0, 85.0, 76.0, 69.0, 57.0, 51.0, 44.0, 33.0, 25.0, 15.0, 12.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.180706024169922, -4.055411338806152, -3.930116653442383, -3.8048219680786133, -3.6795272827148438, -3.554232597351074, -3.4289379119873047, -3.303643226623535, -3.1783485412597656, -3.053053855895996, -2.9277591705322266, -2.802464485168457, -2.6771697998046875, -2.551875114440918, -2.4265804290771484, -2.301285743713379, -2.1759908199310303, -2.0506961345672607, -1.9254014492034912, -1.8001067638397217, -1.6748120784759521, -1.5495173931121826, -1.4242225885391235, -1.298927903175354, -1.1736332178115845, -1.048338532447815, -0.9230438470840454, -0.7977491021156311, -0.6724544167518616, -0.547159731388092, -0.42186498641967773, -0.2965703010559082, -0.17127585411071777, -0.04598115384578705, 0.07931354641914368, 0.2046082615852356, 0.3299029469490051, 0.45519763231277466, 0.580492377281189, 0.7057870626449585, 0.831081748008728, 0.9563764333724976, 1.081671118736267, 1.2069659233093262, 1.3322606086730957, 1.4575552940368652, 1.5828499794006348, 1.7081446647644043, 1.8334393501281738, 1.9587340354919434, 2.084028720855713, 2.2093234062194824, 2.334618091583252, 2.4599127769470215, 2.585207462310791, 2.7105021476745605, 2.83579683303833, 2.9610915184020996, 3.086386203765869, 3.2116808891296387, 3.336975574493408, 3.4622702598571777, 3.5875649452209473, 3.712859630584717, 3.8381545543670654]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 15.0, 11.0, 25.0, 30.0, 47.0, 64.0, 104.0, 183.0, 367.0, 713.0, 1497.0, 3748.0, 11624.0, 51199.0, 502429.0, 413856.0, 45579.0, 10737.0, 3428.0, 1396.0, 656.0, 319.0, 201.0, 120.0, 67.0, 50.0, 21.0, 18.0, 11.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.33935546875, -0.33017539978027344, -0.3209953308105469, -0.3118152618408203, -0.30263519287109375, -0.2934551239013672, -0.2842750549316406, -0.27509498596191406, -0.2659149169921875, -0.25673484802246094, -0.24755477905273438, -0.2383747100830078, -0.22919464111328125, -0.2200145721435547, -0.21083450317382812, -0.20165443420410156, -0.192474365234375, -0.18329429626464844, -0.17411422729492188, -0.1649341583251953, -0.15575408935546875, -0.1465740203857422, -0.13739395141601562, -0.12821388244628906, -0.1190338134765625, -0.10985374450683594, -0.10067367553710938, -0.09149360656738281, -0.08231353759765625, -0.07313346862792969, -0.06395339965820312, -0.05477333068847656, -0.04559326171875, -0.03641319274902344, -0.027233123779296875, -0.018053054809570312, -0.00887298583984375, 0.0003070831298828125, 0.009487152099609375, 0.018667221069335938, 0.0278472900390625, 0.03702735900878906, 0.046207427978515625, 0.05538749694824219, 0.06456756591796875, 0.07374763488769531, 0.08292770385742188, 0.09210777282714844, 0.101287841796875, 0.11046791076660156, 0.11964797973632812, 0.1288280487060547, 0.13800811767578125, 0.1471881866455078, 0.15636825561523438, 0.16554832458496094, 0.1747283935546875, 0.18390846252441406, 0.19308853149414062, 0.2022686004638672, 0.21144866943359375, 0.2206287384033203, 0.22980880737304688, 0.23898887634277344, 0.2481689453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 14.0, 14.0, 20.0, 28.0, 46.0, 55.0, 67.0, 95.0, 89.0, 110.0, 91.0, 84.0, 65.0, 59.0, 48.0, 34.0, 22.0, 14.0, 11.0, 7.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2862892150878906, -0.27667999267578125, -0.2670707702636719, -0.2574615478515625, -0.24785232543945312, -0.23824310302734375, -0.22863388061523438, -0.219024658203125, -0.20941543579101562, -0.19980621337890625, -0.19019699096679688, -0.1805877685546875, -0.17097854614257812, -0.16136932373046875, -0.15176010131835938, -0.14215087890625, -0.13254165649414062, -0.12293243408203125, -0.11332321166992188, -0.1037139892578125, -0.09410476684570312, -0.08449554443359375, -0.07488632202148438, -0.065277099609375, -0.055667877197265625, -0.04605865478515625, -0.036449432373046875, -0.0268402099609375, -0.017230987548828125, -0.00762176513671875, 0.001987457275390625, 0.0115966796875, 0.021205902099609375, 0.03081512451171875, 0.040424346923828125, 0.0500335693359375, 0.059642791748046875, 0.06925201416015625, 0.07886123657226562, 0.088470458984375, 0.09807968139648438, 0.10768890380859375, 0.11729812622070312, 0.1269073486328125, 0.13651657104492188, 0.14612579345703125, 0.15573501586914062, 0.16534423828125, 0.17495346069335938, 0.18456268310546875, 0.19417190551757812, 0.2037811279296875, 0.21339035034179688, 0.22299957275390625, 0.23260879516601562, 0.242218017578125, 0.2518272399902344, 0.26143646240234375, 0.2710456848144531, 0.2806549072265625, 0.2902641296386719, 0.29987335205078125, 0.3094825744628906, 0.319091796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 5.0, 7.0, 6.0, 8.0, 17.0, 15.0, 23.0, 32.0, 36.0, 32.0, 49.0, 91.0, 126.0, 227.0, 338.0, 602.0, 1354.0, 4501.0, 28721.0, 858675.0, 136931.0, 11943.0, 2585.0, 911.0, 471.0, 262.0, 162.0, 91.0, 80.0, 54.0, 49.0, 27.0, 24.0, 19.0, 10.0, 14.0, 9.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.3359375, -0.32537078857421875, -0.3148040771484375, -0.30423736572265625, -0.293670654296875, -0.28310394287109375, -0.2725372314453125, -0.26197052001953125, -0.25140380859375, -0.24083709716796875, -0.2302703857421875, -0.21970367431640625, -0.209136962890625, -0.19857025146484375, -0.1880035400390625, -0.17743682861328125, -0.1668701171875, -0.15630340576171875, -0.1457366943359375, -0.13516998291015625, -0.124603271484375, -0.11403656005859375, -0.1034698486328125, -0.09290313720703125, -0.08233642578125, -0.07176971435546875, -0.0612030029296875, -0.05063629150390625, -0.040069580078125, -0.02950286865234375, -0.0189361572265625, -0.00836944580078125, 0.002197265625, 0.01276397705078125, 0.0233306884765625, 0.03389739990234375, 0.044464111328125, 0.05503082275390625, 0.0655975341796875, 0.07616424560546875, 0.08673095703125, 0.09729766845703125, 0.1078643798828125, 0.11843109130859375, 0.128997802734375, 0.13956451416015625, 0.1501312255859375, 0.16069793701171875, 0.1712646484375, 0.18183135986328125, 0.1923980712890625, 0.20296478271484375, 0.213531494140625, 0.22409820556640625, 0.2346649169921875, 0.24523162841796875, 0.25579833984375, 0.26636505126953125, 0.2769317626953125, 0.28749847412109375, 0.298065185546875, 0.30863189697265625, 0.3191986083984375, 0.32976531982421875, 0.34033203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 13.0, 9.0, 21.0, 20.0, 13.0, 26.0, 31.0, 39.0, 36.0, 61.0, 54.0, 65.0, 74.0, 80.0, 66.0, 54.0, 48.0, 33.0, 35.0, 23.0, 25.0, 25.0, 15.0, 19.0, 16.0, 8.0, 13.0, 5.0, 6.0, 5.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.6845703125, -0.6636428833007812, -0.6427154541015625, -0.6217880249023438, -0.600860595703125, -0.5799331665039062, -0.5590057373046875, -0.5380783081054688, -0.51715087890625, -0.49622344970703125, -0.4752960205078125, -0.45436859130859375, -0.433441162109375, -0.41251373291015625, -0.3915863037109375, -0.37065887451171875, -0.3497314453125, -0.32880401611328125, -0.3078765869140625, -0.28694915771484375, -0.266021728515625, -0.24509429931640625, -0.2241668701171875, -0.20323944091796875, -0.18231201171875, -0.16138458251953125, -0.1404571533203125, -0.11952972412109375, -0.098602294921875, -0.07767486572265625, -0.0567474365234375, -0.03582000732421875, -0.014892578125, 0.00603485107421875, 0.0269622802734375, 0.04788970947265625, 0.068817138671875, 0.08974456787109375, 0.1106719970703125, 0.13159942626953125, 0.15252685546875, 0.17345428466796875, 0.1943817138671875, 0.21530914306640625, 0.236236572265625, 0.25716400146484375, 0.2780914306640625, 0.29901885986328125, 0.3199462890625, 0.34087371826171875, 0.3618011474609375, 0.38272857666015625, 0.403656005859375, 0.42458343505859375, 0.4455108642578125, 0.46643829345703125, 0.48736572265625, 0.5082931518554688, 0.5292205810546875, 0.5501480102539062, 0.571075439453125, 0.5920028686523438, 0.6129302978515625, 0.6338577270507812, 0.65478515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 4.0, 6.0, 11.0, 6.0, 16.0, 21.0, 21.0, 59.0, 61.0, 123.0, 208.0, 414.0, 1090.0, 3127.0, 14262.0, 169014.0, 830213.0, 22819.0, 4501.0, 1433.0, 550.0, 232.0, 123.0, 78.0, 42.0, 36.0, 22.0, 17.0, 13.0, 7.0, 6.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07220458984375, -0.06995677947998047, -0.06770896911621094, -0.0654611587524414, -0.06321334838867188, -0.060965538024902344, -0.05871772766113281, -0.05646991729736328, -0.05422210693359375, -0.05197429656982422, -0.04972648620605469, -0.047478675842285156, -0.045230865478515625, -0.042983055114746094, -0.04073524475097656, -0.03848743438720703, -0.0362396240234375, -0.03399181365966797, -0.03174400329589844, -0.029496192932128906, -0.027248382568359375, -0.025000572204589844, -0.022752761840820312, -0.02050495147705078, -0.01825714111328125, -0.01600933074951172, -0.013761520385742188, -0.011513710021972656, -0.009265899658203125, -0.007018089294433594, -0.0047702789306640625, -0.0025224685668945312, -0.000274658203125, 0.0019731521606445312, 0.0042209625244140625, 0.006468772888183594, 0.008716583251953125, 0.010964393615722656, 0.013212203979492188, 0.015460014343261719, 0.01770782470703125, 0.01995563507080078, 0.022203445434570312, 0.024451255798339844, 0.026699066162109375, 0.028946876525878906, 0.031194686889648438, 0.03344249725341797, 0.0356903076171875, 0.03793811798095703, 0.04018592834472656, 0.042433738708496094, 0.044681549072265625, 0.046929359436035156, 0.04917716979980469, 0.05142498016357422, 0.05367279052734375, 0.05592060089111328, 0.05816841125488281, 0.060416221618652344, 0.06266403198242188, 0.0649118423461914, 0.06715965270996094, 0.06940746307373047, 0.0716552734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 7.0, 3.0, 5.0, 5.0, 11.0, 15.0, 10.0, 17.0, 31.0, 31.0, 37.0, 71.0, 91.0, 116.0, 140.0, 110.0, 78.0, 59.0, 34.0, 24.0, 29.0, 18.0, 20.0, 13.0, 6.0, 2.0, 14.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.4001808166503906e-05, -5.275662988424301e-05, -5.151145160198212e-05, -5.026627331972122e-05, -4.902109503746033e-05, -4.777591675519943e-05, -4.653073847293854e-05, -4.528556019067764e-05, -4.404038190841675e-05, -4.279520362615585e-05, -4.155002534389496e-05, -4.0304847061634064e-05, -3.905966877937317e-05, -3.7814490497112274e-05, -3.656931221485138e-05, -3.5324133932590485e-05, -3.407895565032959e-05, -3.2833777368068695e-05, -3.15885990858078e-05, -3.0343420803546906e-05, -2.909824252128601e-05, -2.7853064239025116e-05, -2.660788595676422e-05, -2.5362707674503326e-05, -2.411752939224243e-05, -2.2872351109981537e-05, -2.1627172827720642e-05, -2.0381994545459747e-05, -1.9136816263198853e-05, -1.7891637980937958e-05, -1.6646459698677063e-05, -1.5401281416416168e-05, -1.4156103134155273e-05, -1.2910924851894379e-05, -1.1665746569633484e-05, -1.0420568287372589e-05, -9.175390005111694e-06, -7.9302117228508e-06, -6.685033440589905e-06, -5.43985515832901e-06, -4.194676876068115e-06, -2.9494985938072205e-06, -1.7043203115463257e-06, -4.591420292854309e-07, 7.860362529754639e-07, 2.0312145352363586e-06, 3.2763928174972534e-06, 4.521571099758148e-06, 5.766749382019043e-06, 7.011927664279938e-06, 8.257105946540833e-06, 9.502284228801727e-06, 1.0747462511062622e-05, 1.1992640793323517e-05, 1.3237819075584412e-05, 1.4482997357845306e-05, 1.57281756401062e-05, 1.6973353922367096e-05, 1.821853220462799e-05, 1.9463710486888885e-05, 2.070888876914978e-05, 2.1954067051410675e-05, 2.319924533367157e-05, 2.4444423615932465e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 15.0, 16.0, 20.0, 34.0, 49.0, 75.0, 99.0, 165.0, 322.0, 555.0, 1088.0, 2416.0, 5740.0, 16538.0, 64910.0, 814841.0, 105889.0, 22462.0, 7431.0, 2958.0, 1371.0, 657.0, 310.0, 197.0, 126.0, 69.0, 61.0, 26.0, 22.0, 21.0, 16.0, 14.0, 3.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.04925537109375, -0.04783296585083008, -0.046410560607910156, -0.044988155364990234, -0.04356575012207031, -0.04214334487915039, -0.04072093963623047, -0.03929853439331055, -0.037876129150390625, -0.0364537239074707, -0.03503131866455078, -0.03360891342163086, -0.03218650817871094, -0.030764102935791016, -0.029341697692871094, -0.027919292449951172, -0.02649688720703125, -0.025074481964111328, -0.023652076721191406, -0.022229671478271484, -0.020807266235351562, -0.01938486099243164, -0.01796245574951172, -0.016540050506591797, -0.015117645263671875, -0.013695240020751953, -0.012272834777832031, -0.01085042953491211, -0.009428024291992188, -0.008005619049072266, -0.006583213806152344, -0.005160808563232422, -0.0037384033203125, -0.002315998077392578, -0.0008935928344726562, 0.0005288124084472656, 0.0019512176513671875, 0.0033736228942871094, 0.004796028137207031, 0.006218433380126953, 0.007640838623046875, 0.009063243865966797, 0.010485649108886719, 0.01190805435180664, 0.013330459594726562, 0.014752864837646484, 0.016175270080566406, 0.017597675323486328, 0.01902008056640625, 0.020442485809326172, 0.021864891052246094, 0.023287296295166016, 0.024709701538085938, 0.02613210678100586, 0.02755451202392578, 0.028976917266845703, 0.030399322509765625, 0.03182172775268555, 0.03324413299560547, 0.03466653823852539, 0.03608894348144531, 0.037511348724365234, 0.038933753967285156, 0.04035615921020508, 0.041778564453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 2.0, 9.0, 7.0, 8.0, 9.0, 15.0, 8.0, 38.0, 33.0, 64.0, 82.0, 138.0, 148.0, 133.0, 92.0, 48.0, 35.0, 28.0, 26.0, 13.0, 13.0, 10.0, 6.0, 11.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0826416015625, -0.08043527603149414, -0.07822895050048828, -0.07602262496948242, -0.07381629943847656, -0.0716099739074707, -0.06940364837646484, -0.06719732284545898, -0.06499099731445312, -0.06278467178344727, -0.060578346252441406, -0.05837202072143555, -0.05616569519042969, -0.05395936965942383, -0.05175304412841797, -0.04954671859741211, -0.04734039306640625, -0.04513406753540039, -0.04292774200439453, -0.04072141647338867, -0.03851509094238281, -0.03630876541137695, -0.034102439880371094, -0.031896114349365234, -0.029689788818359375, -0.027483463287353516, -0.025277137756347656, -0.023070812225341797, -0.020864486694335938, -0.018658161163330078, -0.01645183563232422, -0.01424551010131836, -0.0120391845703125, -0.00983285903930664, -0.007626533508300781, -0.005420207977294922, -0.0032138824462890625, -0.0010075569152832031, 0.0011987686157226562, 0.0034050941467285156, 0.005611419677734375, 0.007817745208740234, 0.010024070739746094, 0.012230396270751953, 0.014436721801757812, 0.016643047332763672, 0.01884937286376953, 0.02105569839477539, 0.02326202392578125, 0.02546834945678711, 0.02767467498779297, 0.029881000518798828, 0.03208732604980469, 0.03429365158081055, 0.036499977111816406, 0.038706302642822266, 0.040912628173828125, 0.043118953704833984, 0.045325279235839844, 0.0475316047668457, 0.04973793029785156, 0.05194425582885742, 0.05415058135986328, 0.05635690689086914, 0.058563232421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 20.0, 35.0, 123.0, 607.0, 123.0, 51.0, 17.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.086722373962402, -6.946247100830078, -6.805771827697754, -6.66529655456543, -6.5248212814331055, -6.384346008300781, -6.243870735168457, -6.103395462036133, -5.962920188903809, -5.822444915771484, -5.68196964263916, -5.541494369506836, -5.401019096374512, -5.2605438232421875, -5.120068550109863, -4.979593276977539, -4.839118003845215, -4.698642730712891, -4.558167457580566, -4.417692184448242, -4.277216911315918, -4.136741638183594, -3.9962663650512695, -3.8557910919189453, -3.7153162956237793, -3.574841022491455, -3.434365749359131, -3.2938904762268066, -3.1534152030944824, -3.012939929962158, -2.872464656829834, -2.7319893836975098, -2.5915143489837646, -2.4510390758514404, -2.310563802719116, -2.170088529586792, -2.0296132564544678, -1.8891379833221436, -1.7486628293991089, -1.6081875562667847, -1.4677122831344604, -1.3272370100021362, -1.186761736869812, -1.0462865829467773, -0.9058112502098083, -0.7653359770774841, -0.6248607635498047, -0.48438549041748047, -0.34391021728515625, -0.20343495905399323, -0.0629597008228302, 0.07751554250717163, 0.21799081563949585, 0.35846608877182007, 0.4989413022994995, 0.6394165754318237, 0.779891848564148, 0.9203671216964722, 1.0608423948287964, 1.201317548751831, 1.3417928218841553, 1.4822680950164795, 1.6227433681488037, 1.763218641281128, 1.9036939144134521]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 6.0, 11.0, 9.0, 14.0, 19.0, 16.0, 21.0, 31.0, 34.0, 40.0, 77.0, 273.0, 200.0, 50.0, 33.0, 28.0, 25.0, 22.0, 18.0, 17.0, 11.0, 8.0, 10.0, 7.0, 5.0, 0.0, 8.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.076354742050171, -1.9853906631469727, -1.8944265842437744, -1.8034626245498657, -1.7124985456466675, -1.6215344667434692, -1.5305705070495605, -1.4396064281463623, -1.348642349243164, -1.2576782703399658, -1.1667141914367676, -1.0757502317428589, -0.9847861528396606, -0.8938220739364624, -0.8028580546379089, -0.7118940353393555, -0.6209299564361572, -0.529965877532959, -0.4390018582344055, -0.34803780913352966, -0.2570737600326538, -0.16610971093177795, -0.0751456618309021, 0.015818357467651367, 0.10678243637084961, 0.19774648547172546, 0.2887105345726013, 0.3796745836734772, 0.470638632774353, 0.5616027116775513, 0.6525667309761047, 0.7435307502746582, 0.8344945907592773, 0.9254586696624756, 1.0164227485656738, 1.1073867082595825, 1.1983507871627808, 1.289314866065979, 1.3802788257598877, 1.471242904663086, 1.5622069835662842, 1.6531710624694824, 1.7441351413726807, 1.8350991010665894, 1.9260631799697876, 2.0170271396636963, 2.1079912185668945, 2.1989552974700928, 2.289919376373291, 2.3808834552764893, 2.4718475341796875, 2.5628116130828857, 2.653775691986084, 2.744739532470703, 2.8357036113739014, 2.9266676902770996, 3.017631769180298, 3.108595848083496, 3.1995599269866943, 3.2905240058898926, 3.3814878463745117, 3.47245192527771, 3.563416004180908, 3.6543800830841064, 3.7453441619873047]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 8.0, 12.0, 16.0, 17.0, 19.0, 22.0, 30.0, 50.0, 37.0, 43.0, 67.0, 214.0, 119.0, 53.0, 36.0, 40.0, 34.0, 28.0, 20.0, 26.0, 21.0, 17.0, 10.0, 11.0, 4.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17206764221191406, -0.16627883911132812, -0.1604900360107422, -0.15470123291015625, -0.1489124298095703, -0.14312362670898438, -0.13733482360839844, -0.1315460205078125, -0.12575721740722656, -0.11996841430664062, -0.11417961120605469, -0.10839080810546875, -0.10260200500488281, -0.09681320190429688, -0.09102439880371094, -0.085235595703125, -0.07944679260253906, -0.07365798950195312, -0.06786918640136719, -0.06208038330078125, -0.05629158020019531, -0.050502777099609375, -0.04471397399902344, -0.0389251708984375, -0.03313636779785156, -0.027347564697265625, -0.021558761596679688, -0.01576995849609375, -0.009981155395507812, -0.004192352294921875, 0.0015964508056640625, 0.00738525390625, 0.013174057006835938, 0.018962860107421875, 0.024751663208007812, 0.03054046630859375, 0.03632926940917969, 0.042118072509765625, 0.04790687561035156, 0.0536956787109375, 0.05948448181152344, 0.06527328491210938, 0.07106208801269531, 0.07685089111328125, 0.08263969421386719, 0.08842849731445312, 0.09421730041503906, 0.100006103515625, 0.10579490661621094, 0.11158370971679688, 0.11737251281738281, 0.12316131591796875, 0.1289501190185547, 0.13473892211914062, 0.14052772521972656, 0.1463165283203125, 0.15210533142089844, 0.15789413452148438, 0.1636829376220703, 0.16947174072265625, 0.1752605438232422, 0.18104934692382812, 0.18683815002441406, 0.192626953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 12.0, 2.0, 1.0, 7.0, 9.0, 14.0, 17.0, 45.0, 50.0, 77.0, 167.0, 379.0, 1301.0, 10077.0, 8362151.0, 12084.0, 1435.0, 374.0, 154.0, 79.0, 55.0, 23.0, 21.0, 14.0, 9.0, 13.0, 5.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7340997457504272, -1.6687462329864502, -1.6033926010131836, -1.5380390882492065, -1.4726855754852295, -1.4073320627212524, -1.3419785499572754, -1.2766249179840088, -1.2112714052200317, -1.1459178924560547, -1.080564260482788, -1.015210747718811, -0.949857234954834, -0.8845037221908569, -0.8191501498222351, -0.7537965774536133, -0.6884430646896362, -0.6230895519256592, -0.5577359795570374, -0.4923824369907379, -0.4270288944244385, -0.36167535185813904, -0.2963218092918396, -0.23096826672554016, -0.16561472415924072, -0.10026118159294128, -0.034907639026641846, 0.030445903539657593, 0.09579944610595703, 0.16115298867225647, 0.2265065312385559, 0.29186007380485535, 0.35721349716186523, 0.4225670397281647, 0.4879205822944641, 0.5532741546630859, 0.618627667427063, 0.68398118019104, 0.7493347525596619, 0.8146883249282837, 0.8800418376922607, 0.9453953504562378, 1.0107488632202148, 1.0761024951934814, 1.1414560079574585, 1.2068095207214355, 1.2721631526947021, 1.3375166654586792, 1.4028701782226562, 1.4682236909866333, 1.5335772037506104, 1.598930835723877, 1.664284348487854, 1.729637861251831, 1.7949914932250977, 1.8603450059890747, 1.9256985187530518, 1.9910520315170288, 2.056405544281006, 2.1217591762542725, 2.187112808227539, 2.2524662017822266, 2.317819833755493, 2.3831732273101807, 2.4485268592834473]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 4.0, 1.0, 8.0, 1.0, 5.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.914140224456787, -2.838815212249756, -2.7634899616241455, -2.688164710998535, -2.612839698791504, -2.5375146865844727, -2.4621894359588623, -2.386864185333252, -2.3115391731262207, -2.2362141609191895, -2.160888910293579, -2.0855636596679688, -2.0102386474609375, -1.9349135160446167, -1.859588384628296, -1.784263253211975, -1.7089381217956543, -1.6336129903793335, -1.5582878589630127, -1.482962727546692, -1.407637596130371, -1.3323124647140503, -1.2569873332977295, -1.1816622018814087, -1.106337070465088, -1.031011939048767, -0.9556868076324463, -0.8803616762161255, -0.8050365447998047, -0.7297114133834839, -0.6543862819671631, -0.5790611505508423, -0.5037362575531006, -0.4284111261367798, -0.353085994720459, -0.2777608633041382, -0.20243573188781738, -0.12711060047149658, -0.05178546905517578, 0.02353966236114502, 0.09886479377746582, 0.17418992519378662, 0.24951505661010742, 0.3248401880264282, 0.400165319442749, 0.4754904508590698, 0.5508155822753906, 0.6261407136917114, 0.7014658451080322, 0.776790976524353, 0.8521161079406738, 0.9274412393569946, 1.0027663707733154, 1.0780915021896362, 1.153416633605957, 1.2287417650222778, 1.3040668964385986, 1.3793920278549194, 1.4547171592712402, 1.530042290687561, 1.6053674221038818, 1.6806925535202026, 1.7560176849365234, 1.8313428163528442, 1.906667947769165]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 5.0, 7.0, 5.0, 14.0, 25.0, 14.0, 27.0, 40.0, 53.0, 48.0, 70.0, 51.0, 75.0, 78.0, 81.0, 67.0, 58.0, 56.0, 53.0, 33.0, 35.0, 22.0, 16.0, 11.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08343505859375, -0.08044052124023438, -0.07744598388671875, -0.07445144653320312, -0.0714569091796875, -0.06846237182617188, -0.06546783447265625, -0.062473297119140625, -0.059478759765625, -0.056484222412109375, -0.05348968505859375, -0.050495147705078125, -0.0475006103515625, -0.044506072998046875, -0.04151153564453125, -0.038516998291015625, -0.0355224609375, -0.032527923583984375, -0.02953338623046875, -0.026538848876953125, -0.0235443115234375, -0.020549774169921875, -0.01755523681640625, -0.014560699462890625, -0.011566162109375, -0.008571624755859375, -0.00557708740234375, -0.002582550048828125, 0.0004119873046875, 0.003406524658203125, 0.00640106201171875, 0.009395599365234375, 0.01239013671875, 0.015384674072265625, 0.01837921142578125, 0.021373748779296875, 0.0243682861328125, 0.027362823486328125, 0.03035736083984375, 0.033351898193359375, 0.036346435546875, 0.039340972900390625, 0.04233551025390625, 0.045330047607421875, 0.0483245849609375, 0.051319122314453125, 0.05431365966796875, 0.057308197021484375, 0.060302734375, 0.06329727172851562, 0.06629180908203125, 0.06928634643554688, 0.0722808837890625, 0.07527542114257812, 0.07826995849609375, 0.08126449584960938, 0.084259033203125, 0.08725357055664062, 0.09024810791015625, 0.09324264526367188, 0.0962371826171875, 0.09923171997070312, 0.10222625732421875, 0.10522079467773438, 0.10821533203125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 2.0, 10.0, 8.0, 20.0, 20.0, 26.0, 22.0, 60.0, 55.0, 106.0, 176.0, 286.0, 510.0, 1073.0, 2428.0, 6607.0, 19003.0, 61506.0, 180164.0, 168314.0, 55537.0, 17535.0, 6069.0, 2389.0, 1041.0, 524.0, 260.0, 151.0, 91.0, 76.0, 52.0, 33.0, 28.0, 16.0, 13.0, 12.0, 11.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.087890625, -1.0538482666015625, -1.019805908203125, -0.9857635498046875, -0.95172119140625, -0.9176788330078125, -0.883636474609375, -0.8495941162109375, -0.8155517578125, -0.7815093994140625, -0.747467041015625, -0.7134246826171875, -0.67938232421875, -0.6453399658203125, -0.611297607421875, -0.5772552490234375, -0.543212890625, -0.5091705322265625, -0.475128173828125, -0.4410858154296875, -0.40704345703125, -0.3730010986328125, -0.338958740234375, -0.3049163818359375, -0.2708740234375, -0.2368316650390625, -0.202789306640625, -0.1687469482421875, -0.13470458984375, -0.1006622314453125, -0.066619873046875, -0.0325775146484375, 0.00146484375, 0.0355072021484375, 0.069549560546875, 0.1035919189453125, 0.13763427734375, 0.1716766357421875, 0.205718994140625, 0.2397613525390625, 0.2738037109375, 0.3078460693359375, 0.341888427734375, 0.3759307861328125, 0.40997314453125, 0.4440155029296875, 0.478057861328125, 0.5121002197265625, 0.546142578125, 0.5801849365234375, 0.614227294921875, 0.6482696533203125, 0.68231201171875, 0.7163543701171875, 0.750396728515625, 0.7844390869140625, 0.8184814453125, 0.8525238037109375, 0.886566162109375, 0.9206085205078125, 0.95465087890625, 0.9886932373046875, 1.022735595703125, 1.0567779541015625, 1.0908203125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 8.0, 12.0, 12.0, 17.0, 28.0, 39.0, 60.0, 58.0, 67.0, 108.0, 119.0, 107.0, 80.0, 69.0, 55.0, 43.0, 25.0, 26.0, 17.0, 12.0, 7.0, 8.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.22381210327148438, -0.21471405029296875, -0.20561599731445312, -0.1965179443359375, -0.18741989135742188, -0.17832183837890625, -0.16922378540039062, -0.160125732421875, -0.15102767944335938, -0.14192962646484375, -0.13283157348632812, -0.1237335205078125, -0.11463546752929688, -0.10553741455078125, -0.09643936157226562, -0.08734130859375, -0.07824325561523438, -0.06914520263671875, -0.060047149658203125, -0.0509490966796875, -0.041851043701171875, -0.03275299072265625, -0.023654937744140625, -0.014556884765625, -0.005458831787109375, 0.00363922119140625, 0.012737274169921875, 0.0218353271484375, 0.030933380126953125, 0.04003143310546875, 0.049129486083984375, 0.0582275390625, 0.06732559204101562, 0.07642364501953125, 0.08552169799804688, 0.0946197509765625, 0.10371780395507812, 0.11281585693359375, 0.12191390991210938, 0.131011962890625, 0.14011001586914062, 0.14920806884765625, 0.15830612182617188, 0.1674041748046875, 0.17650222778320312, 0.18560028076171875, 0.19469833374023438, 0.20379638671875, 0.21289443969726562, 0.22199249267578125, 0.23109054565429688, 0.2401885986328125, 0.24928665161132812, 0.25838470458984375, 0.2674827575683594, 0.276580810546875, 0.2856788635253906, 0.29477691650390625, 0.3038749694824219, 0.3129730224609375, 0.3220710754394531, 0.33116912841796875, 0.3402671813964844, 0.349365234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 17.0, 32.0, 51.0, 99.0, 104.0, 64.0, 51.0, 18.0, 9.0, 6.0, 7.0, 3.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9511016607284546, -0.8965842127799988, -0.8420668244361877, -0.7875493764877319, -0.7330319881439209, -0.6785145401954651, -0.6239970922470093, -0.5694797039031982, -0.5149622559547424, -0.460444837808609, -0.4059274196624756, -0.3514099717140198, -0.29689255356788635, -0.24237513542175293, -0.18785768747329712, -0.1333402693271637, -0.07882285118103027, -0.024305425584316254, 0.030212000012397766, 0.08472943305969238, 0.1392468512058258, 0.19376426935195923, 0.24828171730041504, 0.30279913544654846, 0.3573165535926819, 0.4118339717388153, 0.46635138988494873, 0.5208688378334045, 0.5753862857818604, 0.6299036741256714, 0.6844211220741272, 0.738938570022583, 0.7934558391571045, 0.8479732871055603, 0.9024906754493713, 0.9570081233978271, 1.0115255117416382, 1.0660429000854492, 1.1205604076385498, 1.1750777959823608, 1.2295951843261719, 1.284112572669983, 1.3386300802230835, 1.3931474685668945, 1.4476648569107056, 1.5021822452545166, 1.5566997528076172, 1.6112171411514282, 1.6657346487045288, 1.7202520370483398, 1.7747695446014404, 1.8292869329452515, 1.8838043212890625, 1.938321828842163, 1.9928392171859741, 2.047356605529785, 2.1018741130828857, 2.1563916206359863, 2.210908889770508, 2.2654263973236084, 2.319943904876709, 2.3744611740112305, 2.428978681564331, 2.4834961891174316, 2.538013458251953]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 5.0, 10.0, 4.0, 13.0, 23.0, 20.0, 49.0, 70.0, 76.0, 66.0, 35.0, 35.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2129456996917725, -1.1660399436950684, -1.1191341876983643, -1.0722284317016602, -1.025322675704956, -0.9784169793128967, -0.9315112829208374, -0.8846055269241333, -0.8376997709274292, -0.7907940149307251, -0.743888258934021, -0.6969825625419617, -0.6500768065452576, -0.6031710505485535, -0.5562653541564941, -0.50935959815979, -0.46245384216308594, -0.41554808616638184, -0.3686423599720001, -0.3217366337776184, -0.2748308777809143, -0.2279251366853714, -0.1810193955898285, -0.13411366939544678, -0.08720791339874268, -0.04030217230319977, 0.00660356879234314, 0.05350930988788605, 0.10041505098342896, 0.14732079207897186, 0.19422653317451477, 0.24113225936889648, 0.28803789615631104, 0.33494365215301514, 0.38184937834739685, 0.42875510454177856, 0.47566086053848267, 0.5225666165351868, 0.5694723129272461, 0.6163780689239502, 0.6632838249206543, 0.7101895809173584, 0.7570953369140625, 0.8040010333061218, 0.8509067893028259, 0.89781254529953, 0.9447182416915894, 0.9916239976882935, 1.0385297536849976, 1.0854355096817017, 1.1323412656784058, 1.1792470216751099, 1.2261526584625244, 1.2730584144592285, 1.3199641704559326, 1.3668699264526367, 1.4137756824493408, 1.460681438446045, 1.507587194442749, 1.5544929504394531, 1.6013987064361572, 1.6483043432235718, 1.6952100992202759, 1.74211585521698, 1.789021611213684]}, "eval/loss": 4.050220966339111, "eval/wer": 1.7867314557715193, "eval/runtime": 594.0081, "eval/samples_per_second": 4.448, "eval/steps_per_second": 0.557} \ No newline at end of file